#include <iostream>
#include <string.h>
using namespace std;
char key[10][20] = {"begin","if","then","while","do","end","int","main","return","cout"};// keyword table: a two-dimensional char array holding the reserved words
char token[20]; // holds the characters of the current token (word)
// Keyword lookup.
// Compares s against every entry of the `key` table and returns the category
// code of the matching keyword, or -1 when s is not a keyword.
// Codes: begin=1, if=2, then=3, while=4, do=5, end=6, int=7, main=8 (index + 1)
//        return=12, cout=13                                         (index + 4)
int isKey(char s[])
{
    int idx = 0;
    while(idx < 10)
    {
        if(strcmp(s, key[idx]) == 0)
        {
            // The first eight keywords are numbered from 1; the last two from 12.
            return (idx < 8) ? (idx + 1) : (idx + 4);
        }
        ++idx;
    }
    return -1;
}
// Letter test: true when ch is an ASCII letter ('a'..'z' or 'A'..'Z').
bool isChar(char ch)
{
    const bool lower = ('a' <= ch) && (ch <= 'z');
    const bool upper = ('A' <= ch) && (ch <= 'Z');
    return lower || upper;
}
// Digit test: true when ch is one of the decimal digits '0'..'9'.
bool isNum(char ch)
{
    return !(ch < '0' || ch > '9');
}
// Core lexer routine: extracts one token from s, starting at index p.
//
// Parameters:
//   identifier - output: category code of the token that was read
//   p          - input/output: index into s where scanning starts; on return
//                it is the index of the first character after the token
//   s          - NUL-terminated input text
//
// The lexeme is stored NUL-terminated in the global `token` buffer. Lexemes
// longer than the buffer are consumed completely but stored truncated.
//
// Category codes:
//   keywords : value returned by isKey
//   10       : identifier, letter(letter|digit)*
//   11       : number, digit(digit)*
//   22 '+'  23 '-'  24 '*'  25 '/'  26 '('  27 ')'  28 '['  29 ']'
//   30 '{'  31 '}'  32 ','  33 ':'  34 ';'  35 '>'  36 '<'  41 '"'
//   18 ":="  21 "=="  37 ">="  38 "<="  40 "!="
//   0        : '#'
//   1000     : a backslash followed by '0'
//   -1       : anything else (lone '!', lone '=', lone backslash, unknown
//              characters) and the end of the input
void scanner(int &identifier,int &p,char s[])
{
    // Longest lexeme that fits in `token` while leaving room for the terminator.
    const int maxLen = static_cast<int>(sizeof(token)) - 1;
    int count = 0;

    // Skip every leading blank, not only the first one.
    while(s[p] == ' ') p++;

    // End of input: report "no token" and leave p on the terminator so the
    // caller never ends up indexing past the end of the string.
    if(s[p] == '\0')
    {
        token[0] = '\0';
        identifier = -1;
        return;
    }

    // Starts with a letter: keyword or identifier.
    if(isChar(s[p]))
    {
        while(isNum(s[p]) || isChar(s[p]))
        {
            // Keep consuming the lexeme, but never write past the buffer.
            if(count < maxLen) token[count++] = s[p];
            p++;
        }
        token[count] = '\0';
        identifier = isKey(token);
        if(identifier == -1)
        {
            identifier = 10; // identifier: letter(letter|digit)*
        }
        return;
    }

    // Starts with a digit: number.
    if(isNum(s[p]))
    {
        while(isNum(s[p]))
        {
            if(count < maxLen) token[count++] = s[p];
            p++;
        }
        token[count] = '\0';
        identifier = 11; // number: digit(digit)*
        return;
    }

    // Operator or delimiter. s[p] is not the terminator here, so s[p+1] is
    // still inside the string (at worst it is the terminator itself).
    const char ch = s[p];
    const char next = s[p+1];
    int length = 1; // number of input characters that make up this token

    switch(ch)
    {
    // Single-character tokens.
    case '+': identifier = 22; break;
    case '-': identifier = 23; break;
    case '*': identifier = 24; break;
    case '/': identifier = 25; break;
    case '(': identifier = 26; break;
    case ')': identifier = 27; break;
    case '[': identifier = 28; break;
    case ']': identifier = 29; break;
    case '{': identifier = 30; break;
    case '}': identifier = 31; break;
    case ',': identifier = 32; break;
    case ';': identifier = 34; break;
    case '"': identifier = 41; break;
    case '#': identifier = 0;  break;

    // Tokens that may be one or two characters long. Each case decides from
    // the single look-ahead character only, so a completed two-character
    // operator can never be merged with a following '='.
    case ':': // ":=" or ':'
        if(next == '=') { identifier = 18; length = 2; }
        else            { identifier = 33; }
        break;
    case '<': // "<=" or '<'
        if(next == '=') { identifier = 38; length = 2; }
        else            { identifier = 36; }
        break;
    case '>': // ">=" or '>'
        if(next == '=') { identifier = 37; length = 2; }
        else            { identifier = 35; }
        break;
    case '=': // "=="; a lone '=' has no category code in this table
        if(next == '=') { identifier = 21; length = 2; }
        else            { identifier = -1; }
        break;
    case '!': // "!="; a lone '!' is reported as -1
        if(next == '=') { identifier = 40; length = 2; }
        else            { identifier = -1; }
        break;
    case '\\': // backslash followed by '0'; a lone backslash is reported as -1
        if(next == '0') { identifier = 1000; length = 2; }
        else            { identifier = -1; }
        break;

    // Unknown character: report it instead of leaving stale results behind.
    default:
        identifier = -1;
        break;
    }

    // Store the complete lexeme, always NUL-terminated.
    token[0] = ch;
    if(length == 2)
    {
        token[1] = next;
        token[2] = '\0';
    }
    else
    {
        token[1] = '\0';
    }

    // Move past the token that was just read.
    p += length;
}
// Driver: reads whitespace-delimited chunks from standard input, splits each
// chunk into tokens with scanner, and prints every token as <lexeme,code>.
int main()
{
    char s[100]; // one chunk of input text
    for(;;)
    {
        // Bound the extraction to the buffer size so a long word cannot
        // overflow s. operator>> resets the width to 0 after each read, so it
        // has to be set again before every extraction. A word longer than the
        // buffer is delivered in several chunks.
        cin.width(sizeof(s));
        if(!(cin>>s)) break;

        // Length is fixed for this chunk; compute it once as a signed value
        // so the comparison with p is not mixed signed/unsigned.
        const int len = static_cast<int>(strlen(s));
        int p = 0;
        int identifier = -1; // defined value even if scanner leaves it untouched
        while(p < len) // loop until p reaches the end of the chunk
        {
            scanner(identifier,p,s);
            cout<<'<'<<token<<','<<identifier<<'>'<<'\n';
        }
    }
    return 0;
}
// 04-22
// 1136