词法分析程序(Lexical Analyzer)要求:
- 从左至右扫描构成源程序的字符流
- 识别出有词法意义的单词(Lexemes)
- 返回单词记录(单词类别,单词本身)
- 滤掉空格
- 跳过注释
- 发现词法错误
程序结构:
输入:字符流(什么输入方式,什么数据结构保存)
处理:
–遍历(什么遍历方式)
–词法规则
输出:单词流(什么输出形式)
–二元组
单词类别:
1.标识符(10)
2.无符号数(11)
3.保留字(一词一码)
4.运算符(一词一码)
5.界符(一词一码)
单词符号 |
种别码 |
单词符号 |
种别码 |
begin |
1 |
: |
17 |
if |
2 |
:= |
18 |
then |
3 |
< |
20 |
while |
4 |
<= |
21 |
do |
5 |
<> |
22 |
end |
6 |
> |
23 |
l(l|d)* |
10 |
>= |
24 |
dd* |
11 |
= |
25 |
+ |
13 |
; |
26 |
- |
14 |
( |
27 |
* |
15 |
) |
28 |
/ |
16 |
# |
0 |
1 #include<stdio.h> 2 #include<string.h> 3 #include<stdlib.h> 4 char savearray[100],outarray[100]; 5 char ch; 6 int row,arrays,count,m,i,p;//count为计数器 p为指针 7 char *wordsymbol[6] = {"if", "begin", "then", "while", "do", "end"}; 8 void getarrays(){ 9 for(i = 0; i < 8; i++){ 10 outarray[i] == NULL; 11 } 12 ch = savearray[p++]; 13 while(ch == ' '){ 14 ch = savearray[p]; 15 p++; 16 } 17 18 if((ch >= 'a' && ch <= 'z') || (ch >= 'A' && ch <='Z')){ 19 m = 0; 20 while((ch <= '9' && ch>= '0') || (ch >= 'a' && ch <= 'z') || (ch >= 'A' && ch <= 'Z')){ 21 outarray[m++] = ch; 22 ch = savearray[p++]; 23 } 24 outarray[m++] = '\0'; 25 p--; 26 arrays = 10; 27 for(i = 0; i < 6; i++){ 28 if(strcmp(wordsymbol[i],outarray) == 0){ 29 arrays =1 + i; 30 break; 31 } 32 33 } 34 }else if(ch <= '9' && ch>= '0'){ 35 count = 0; 36 while(ch >= '0' && ch <='9'){ 37 count *= 10 + (ch - '0'); 38 ch = savearray[p++]; 39 } 40 p--; 41 arrays = 11; 42 } else switch(ch){ 43 case '+': 44 outarray[0] = ch; 45 arrays = 13; 46 return; 47 case '-': 48 outarray[0] = ch; 49 arrays = 14; 50 return; 51 case '*': 52 outarray[0] = ch; 53 arrays = 15; 54 break; 55 case '/': 56 outarray[0] = ch; 57 arrays = 16; 58 break; 59 case ':': 60 i = 0; 61 outarray[i++] = ch; 62 ch = savearray[p++]; 63 if(ch == '='){ 64 outarray[i++] = ch; 65 arrays = 18; 66 }else{ 67 arrays = 17; 68 p--; 69 } 70 return; 71 72 case '<': 73 i = 0; 74 outarray[i++] = ch; 75 ch = savearray[p++]; 76 if(ch == '='){ 77 outarray[i++] = ch; 78 arrays = 21; 79 80 }else if(ch == '='){ 81 outarray[i++] = ch; 82 arrays = 22; 83 }else{ 84 arrays = 20; 85 p--; 86 } 87 return; 88 case '>': 89 i = 0; 90 outarray[i++] = ch; 91 ch = savearray[p++]; 92 if(ch == '='){ 93 outarray[i++] = ch; 94 arrays = 24; 95 }else{ 96 arrays = 23; 97 p--; 98 } 99 return; 100 case '=': 101 outarray[0] = ch; 102 arrays = 25; 103 break; 104 case ';': 105 outarray[0] = ch; 106 arrays = 26; 107 break; 108 case '(': 109 outarray[0] = ch; 110 arrays = 27; 111 break; 112 case ')': 113 outarray[0] = ch; 114 arrays = 28; 115 break; 116 case '#': 117 outarray[0] = ch; 118 arrays = 0; 119 break; 120 case '\n': 121 arrays = 100; 122 break; 123 default: 124 arrays = -1; 125 } 126 } 127 int main(){ 128 int p = 0, 129 row = 1; 130 printf("输入测试语句:"); 131 do{ 132 ch = getchar(); 133 savearray[p++] = ch; 134 }while(ch != '#'); 135 136 p = 0; 137 do{ 138 getarrays(); 139 switch(arrays){ 140 case -1: 141 printf("第%d行有问题",row); 142 break; 143 case 100: 144 row += 1; 145 break; 146 case 11: 147 printf("(%d,%d)\n", count,arrays); 148 break; 149 default: 150 printf("(%s,%d)\n",outarray,arrays); 151 } 152 }while(arrays != 0); 153 } 154 155 156