词法分析器就是通过扫描一段程序判断是否是关键字、标识符、常数、分界符、运算符。一般分为一符一种和经典五中;
这里我用的是经典五中,此词法分析器是用c++编写的;
/*
保留字|关键字:1
操作符|运算符:2
分界符:3
标识符:4
常数:5
无识别:6
*/
主要代码为:
#include<iostream>
using namespace std;
#define MAX 10
/*
保留字|关键字:1
操作符|运算符:2
分界符:3
标识符:4
常数:5
无识别:6
*/
char ch = ' ';
char* keyWord[10] = {"void","main","break","include","begin","end","if","else","while","switch"};
char token[20];//定义获取的字符
//判断是否是关键字
bool isKey(char * token)
{
for(int i = 0;i < MAX;i++)
{
if(strcmp(token,keyWord[i]) == 0)
return true;
}
return false;
}
//判断是否是字母
bool isLetter(char letter)
{
if((letter >= 'a' && letter <= 'z')||(letter >= 'A' && letter <= 'Z'))
return true;
else
return false;
}
//判断是否是数字
bool isDigit(char digit)
{
if(digit >= '0' && digit <= '9')
return true;
else
return false;
}
//词法分析
void analyze(FILE *fpin)
{
while((ch = fgetc(fpin)) != EOF){
if(ch == ' '||ch == ' '||ch == '
'){}
else if(isLetter(ch)){
char token[20]={' '};
int i=0;
while(isLetter(ch)||isDigit(ch)){
token[i] = ch;
i++;
ch = fgetc(fpin);
}
//回退一个指针
fseek(fpin,-1L,SEEK_CUR);
if(isKey(token)){
//关键字
cout<<token<<" 1"<<" 关键字"<<endl;
}
else{
//标识符
cout<<token<<" 4"<<" 标识符"<<endl;
}
}
else if(isDigit(ch)||(ch == '.'))
{
int i=0;
char token[20]={' '};
while(isDigit(ch)||(ch == '.'&&isDigit(fgetc(fpin))))
{
if(ch == '.')fseek(fpin,-1L,SEEK_CUR);
token[i] = ch;
i++;
ch = fgetc(fpin);
}
fseek(fpin,-1L,SEEK_CUR);
//属于无符号常数
cout<<token<<" 5"<<" 常数"<<endl;
}
else switch(ch){
//运算符
case '+':{
ch = fgetc(fpin);
if(ch == '+')cout<<"++"<<" 2"<<" 运算符"<<endl;
else {
cout<<"+"<<" 2"<<" 运算符"<<endl;
fseek(fpin,-1L,SEEK_CUR);
}
}break;
case '-':{
ch = fgetc(fpin);
if(ch == '-')cout<<"--"<<" 2"<<" 运算符"<<endl;
else {
cout<<"-"<<" 2"<<" 运算符"<<endl;
fseek(fpin,-1L,SEEK_CUR);
}
}break;
case '*':cout<<ch<<" 2"<<" 运算符"<<endl;break;
case '/':cout<<ch<<" 2"<<" 运算符"<<endl;break;
//分界符
case '(':cout<<ch<<" 3"<<" 分界符"<<endl;break;
case ')':cout<<ch<<" 3"<<" 分界符"<<endl;break;
case '[':cout<<ch<<" 3"<<" 分界符"<<endl;break;
case ']':cout<<ch<<" 3"<<" 分界符"<<endl;break;
case ';':cout<<ch<<" 3"<<" 分界符"<<endl;break;
case '{':cout<<ch<<" 3"<<" 分界符"<<endl;break;
case '}':cout<<ch<<" 3"<<" 分界符"<<endl;break;
//运算符
case '=':{
ch = fgetc(fpin);
if(ch == '=')cout<<"=="<<" 2"<<" 运算符"<<endl;
else {
cout<<"="<<" 2"<<" 运算符"<<endl;
fseek(fpin,-1L,SEEK_CUR);
}
}break;
case ':':{
ch = fgetc(fpin);
if(ch == '=')cout<<":="<<" 2"<<" 运算符"<<endl;
else {
cout<<":"<<" 2"<<" 运算符"<<endl;
fseek(fpin,-1L,SEEK_CUR);
}
}break;
case '>':{
ch = fgetc(fpin);
if(ch == '=')cout<<">="<<" 2"<<" 运算符"<<endl;
else {
cout<<">"<<" 2"<<" 运算符"<<endl;
fseek(fpin,-1L,SEEK_CUR);
}
}break;
case '<':{
ch = fgetc(fpin);
if(ch == '=')cout<<"<="<<" 2"<<" 运算符"<<endl;
else {
cout<<"<"<<" 2"<<" 运算符"<<endl;
fseek(fpin,-1L,SEEK_CUR);
}
}break;
//无识别
default: cout<<ch<<" 6"<<" 无识别符"<<endl;
}
}
}
int main(){
char input[30];
FILE *fpin;
cout<<"请输入源文件名:
"<<endl;
for(;;){
cin>>input;
if((fpin = fopen(input,"r")) != NULL)
break;
else
cout<<"路径输入错误"<<endl;
}
cout<<"****************词法分析结果********************"<<endl;
analyze(fpin);
fclose(fpin);
}
运行结果:


