词法分析
可识别内容:
标识符:id
数字:num
关键字:int,char,if,else,while,do,for
标号:, , . , ;
算术运算符号:=,+,-,*,/,&,!,|,&&,||
关系运算符:<,<=,>=,>,==,!=
注释://
内码定义:
单个符号,如{,+,*,> 等,均使用其ascii码做内码,占双或多个字节的符号(包括保留字,标号,数字,运算符等)为其取名如下:
Enum { END=0,INT,CHAR,IF,ELSE,WHILE=5,
DO,FOR,ARGAND,ARGOR,NUM=10,
ID,LESSEQUAL,EQUAL,GREATEQUAL,NOTEQUAL=15 };
其中NUM代表数字,ID代表标识符.
测试程序1-1的词法分析结果如下:
内码表
123 { 11 X 61 = 10 12 43 + 43 + 11 b 47 / 10 13 45 - 10 5 42 * 10 4 42 * 10 9 59 ; 11 Y 61 = |
10 4 42 * 10 1024 59 ; 3 if 40 ( 11 X 14 >= 11 Y 41 ) 123 { 3 if 40 ( 11 i 13 == 11 i |
41 ) 123 { 11 X 61 = 11 Y 125 } 125 } 59 ; 59 ; 59 ; 59 ; 5 while 40 ( 11 X 60 <
|
11 Y 41 ) 123 { 11 X 61 = 11 X 43 + 10 1 59 ; 125 } 125 } |
语法分析
C语言子集,可支持
语句块,语句,条件语句,While循环语句,赋值语句,基本算术表达式等。例如:
{
// Comment Supported : This is only a Test ^_^
X = 12 + b / 13 - 5 * 4 * 9; // A AssignmentStatement
Y = 4 * 1024;
if( X >= Y){
if( i == i){ // This is nested if Statement
X=Y;
}
}
;;;; // This is Null Statement
while( X < Y){ // This is while Statement
X = X +1;
}
}
测试程序1-1
支持错误检测,如将上面例子中X = 12 + b / 13 - 5 * 4 * 9;
故意修改为:X = 12 ++ b / 13 - 5 * 4 * 9; 则会出现如下错误提示,指示了出错行数和行内偏移位置:
规则如下:
<StatementBlock> ::= '{'<StatementSequence>'}'
<StatementSequence> ::= {<NullStatement>|<CommonStatement>|<VariantStatement>}
<NullStatement> ::= ';'
<CommonStatement> ::= <AssignmentStatement>
<VariantStatement> ::= <ConditionStatement>| <LoopWhileStatement>
<AssignmentStatement> ::= ID=<Expression>
<ConditionStatement> ::= if(<Condition> <StatementBlock>
<LoopWhileStatement> ::= while(<Condition> <StatementBlock>
<Condition> ::= <Expression><RelationOperator><Expression>
<Expression> ::= <Item>{+<Item>|-<Item>}
<Item> ::= <Factor>{*<Factor>|/<Factor>}
<Factor> ::= ID|NUM|(<Expression>)
<RelationOperator> ::= <|<=|>=|>|==|!=
//非终结符的英文定义
void StatementBlock(); //语句块
void StatementSequence(); //语句串
// XxxxxStatement() 为三类语句
void NullStatement(); //空语句--仅仅含有一个;号
void CommonStatement(); //语句
void VariantStatement(); //变种语句--包括 if(){},while{},他们都不以;结尾
// 下面的属于CommonStatement
void AssignmentStatement(); //赋值语句
// 下面两种属于VariantStatement
void ConditionStatement(); //条件语句
void LoopWhileStatement(); //while循环语句
void Condition(); //条件
void Expression(); //表达式
void Item(); //项
void Factor(); //因子
void RelationOperator(); //关系运算符
不能支持的主要方面:函数调用的识别,逗号表达式,for循环,switch语句。
词法分析:
//
LexAly.cpp :C子集词法分析程序
data:image/s3,"s3://crabby-images/5bd17/5bd1786902cebb06aebbcf14deee58e186e3a7a2" alt=""
/**/
/*
支持内容:
标识符:id
关键字: int,char,if,else,while,do,for
标号: ,, ., ;
算术运算符号: =,+,-,&,!,|,&&,||
data:image/s3,"s3://crabby-images/5226a/5226ab9e8c2a9d9c900f5c95a5f80319d932cdb7" alt=""
全局字符串:
instr 记录待解析的字符串
string 存贮当前被解析到的ID
data:image/s3,"s3://crabby-images/5f751/5f75114c5737e7a3e611377dbe23b36a2c541b6b" alt=""
接口:
gettoken();
data:image/s3,"s3://crabby-images/e3998/e39984c2abf5a2f1ec40165554575382d665b943" alt=""
data:image/s3,"s3://crabby-images/49f23/49f23e883ecb058b10dae2f3e27dfa68f2968db1" alt=""
data:image/s3,"s3://crabby-images/ce103/ce10356c04a1e6d97727bf569051079865451d63" alt=""
Sample:
输入:
instr =
for(i=0;i<10;i++){
j=i+10;
printf("%d",j);
}
输出:
for
(
i
……
}
data:image/s3,"s3://crabby-images/d16ff/d16fff1841670725f34a4a54a53d2b99524d4eb0" alt=""
data:image/s3,"s3://crabby-images/128f2/128f2b6518580d8492c086a674606e14834cacc6" alt=""
注意:
要记得处理程序中未显示出来的符号,如空白(' '),回车(' '),值表符(' ')
*/
data:image/s3,"s3://crabby-images/e772b/e772b4837c723cc261e127830ab7e96a6213c573" alt=""
#include
"
stdafx.h
"
#include
<
ctype.h
>
#include
<
stdlib.h
>
#include
<
string.h
>
#include
"
Constant.h
"
data:image/s3,"s3://crabby-images/03fba/03fba6c81a3d73ce7487eaa27045f67534c74d53" alt=""
extern
void
grammar_check();
data:image/s3,"s3://crabby-images/fb649/fb64952c54867da32f42df3dd73877ea3e6bbdbd" alt=""
data:image/s3,"s3://crabby-images/13242/1324240b633b1f4f7acbb86045ede4eab9a9e1d8" alt=""
//
注意:这里累计数目(最大值)不能大于32 (10 0000B)TOKEN
//
enum {END=0,INT=1,CHAR,IF,ELSE,WHILE,DO,FOR,ARGAND,ARGOR,NUM,ID} ;
data:image/s3,"s3://crabby-images/48b10/48b108a8443aaffe222e0f46cf08d63cc62584f7" alt=""
char
index[][
20
]
=
...
{
data:image/s3,"s3://crabby-images/469b5/469b50e5121743428d4110924de1dd1a95e48000" alt=""
...{"END OF File"}, /**//* 0 END*/
data:image/s3,"s3://crabby-images/f9359/f93595e8adec855d9db40ba41a4803971270fd5e" alt=""
...{"int"}, /**//* 1 INT*/
data:image/s3,"s3://crabby-images/31585/31585967acb4abd3612b1c87ea286b70eae54042" alt=""
...{"char"}, /**//* 2 CHAR*/
data:image/s3,"s3://crabby-images/20156/201560a83e3e2341c8e82805de26b6b073dbe8e3" alt=""
...{"if"}, /**//* 3 IF*/
data:image/s3,"s3://crabby-images/6a7ad/6a7ad2197ee8aca3a346e19b44edc3ab9c87d753" alt=""
...{"else"}, /**//* 4 ELSE*/
data:image/s3,"s3://crabby-images/3ff97/3ff976f6402d51fd120c427ebae6521a3d3125ad" alt=""
...{"while"}, /**//* 5 WHILE*/
data:image/s3,"s3://crabby-images/6bd63/6bd632ec29a2ba23bd04c12384cd2c5cb3a88ddf" alt=""
...{"do"}, /**//* 6 DO*/
data:image/s3,"s3://crabby-images/29585/29585af089a9fd3d52dd3797f60fbc922cedae27" alt=""
...{"for"}, /**//* 7 FOR*/
data:image/s3,"s3://crabby-images/54f53/54f531c00d1bfa142dd36ce91a85db8fdc7eca5a" alt=""
...{"&&"}, /**//* 8 ARGAND*/
data:image/s3,"s3://crabby-images/9a738/9a738b2d82fd3d87d179a668fd50791d2c85cc57" alt=""
...{"||"}, /**//* 9 ARGOR*/
data:image/s3,"s3://crabby-images/7a78a/7a78acf849c2cd3529c5cac5b49840d59a79c0d8" alt=""
...{""}, /**//* 10 NUM */
data:image/s3,"s3://crabby-images/61451/614511c6f62ff3a22f69afa038f57cc0c6d7187a" alt=""
...{""}, /**//* 11 ID */
data:image/s3,"s3://crabby-images/a985d/a985dc80447dbeb5245380dc74befd803bfae732" alt=""
...{"<="}, /**//* 12 LESSEQUAL */
data:image/s3,"s3://crabby-images/6c73f/6c73fa50b464ebe4970086a2a9a588889a9e5348" alt=""
...{"=="}, /**//* 13 EQUAL */
data:image/s3,"s3://crabby-images/c6c6d/c6c6d2d10a7c6e2396f5a04d49f574aed0dddbb0" alt=""
...{">="}, /**//* 14 GREATEQUAL */
data:image/s3,"s3://crabby-images/ea921/ea921232a7496022e060eadb6fd7daa7b4178436" alt=""
...{"!="}, /**//* 15 NOTEQUAL */
data:image/s3,"s3://crabby-images/3b17e/3b17ea6a53cb5fdf180993f751dc8a4362bde7b6" alt=""
...{""} /**//* 16 ID */
}
;
data:image/s3,"s3://crabby-images/eaaa9/eaaa994a5650aac88ecb386749d2ef1fdf17289c" alt=""
data:image/s3,"s3://crabby-images/c0971/c097147b793849cb271e638d3d7c8cf8c2e20455" alt=""
char
input[
10000
]
=
...
{0}
;
data:image/s3,"s3://crabby-images/18663/18663f5543ec618d61474beb993c7e53a17e9629" alt=""
char
*
instr
=
input;
char
*
const
start_of_instr
=
input;
data:image/s3,"s3://crabby-images/fefef/fefef3a9e5960fda4035a1d62bc3e0fd4218b279" alt=""
//
string 包含gettoken最新得到的id等串
//
gym包含 gettoken得到的内容的代号
//
current_line 包含当前行号
char
string[MAX_INDENT];
int
sym;
int
current_line
=
1
;
int
start_pos_of_current_line;
data:image/s3,"s3://crabby-images/9b8fa/9b8fa26de3a477b379be72af438892cbdae67f4e" alt=""
char
*
strstart;
//
用于辅助识别num,id
int
gettoken();
int
_gettoken();
data:image/s3,"s3://crabby-images/53d2d/53d2d2a42dd83ab736f7a6daf6b227ce43eee5a1" alt=""
void
error(
char
*
cur);
char
*
getlinestring(
int
line,
char
*
in_buf);
int
nextline();
int
getline();
int
getcurrentpos();
data:image/s3,"s3://crabby-images/a6ab2/a6ab2bb80e064b52cb72c20478d29658fefb7587" alt=""
data:image/s3,"s3://crabby-images/663cb/663cb3284e67ff2a6d4af6e3a49984f652faf301" alt=""
data:image/s3,"s3://crabby-images/107a1/107a174da05ddc2afd815b19a62657cc673907f9" alt=""
int
nextline()
...
{ return ++current_line; }
data:image/s3,"s3://crabby-images/ac994/ac9941b8cbd3d2e8dac1f730985d4e7b554bbf39" alt=""
int
getline()
...
{ return current_line; }
data:image/s3,"s3://crabby-images/123a4/123a429e61d67ef200ae2b229c50ccf0703fb0dd" alt=""
int
getcurrentpos()
...
{ return (int)instr; }
data:image/s3,"s3://crabby-images/a5a66/a5a66a4946ffcd8ec1d21fcd2ca70a260cc6205d" alt=""
char
*
getlinestring(
int
line,
char
*
in_buf)
data:image/s3,"s3://crabby-images/4fd14/4fd145a8c8fc18954794ba8acc33afa015bd0777" alt=""
...
{
char * t = input;
int i = 1;
data:image/s3,"s3://crabby-images/7a1ed/7a1ed2ff29a30d4814f96e3ac8630f656861ee1b" alt=""
data:image/s3,"s3://crabby-images/a69e3/a69e32b0824011358bb52b5b73f7dc584ed72265" alt=""
while(*t != 0 && i < line )...{
if( *t==' ' ) i++;
t++;
}
data:image/s3,"s3://crabby-images/c9191/c9191330035668c66f765a993156e3c0cb8d855d" alt=""
int len = 0;
data:image/s3,"s3://crabby-images/938a2/938a2b7084ab2c27bdeb211a04e8321cac532cea" alt=""
while ( *t != ' ' )...{
in_buf[len] = *t;
len++;
t++;
}
in_buf[len] = 0;
return in_buf;
}
data:image/s3,"s3://crabby-images/09713/0971323ffd3bc420ca9598d6c122fa5f9129682f" alt=""
void
error(
char
*
cur)
data:image/s3,"s3://crabby-images/91729/91729d27109070b83e1e4d9f207621cee08f77ea" alt=""
...
{
printf("Spell Error found at line %d ",getline());
exit(0);
}
data:image/s3,"s3://crabby-images/708d3/708d3060a29f1e998ea5fab5d766c0b58506fb56" alt=""
data:image/s3,"s3://crabby-images/bee1f/bee1f8fe395a0be0ca05868792994b9b65e2b5f0" alt=""
//
语法分析
int
main_grammar(
char
*
filename)
data:image/s3,"s3://crabby-images/253c8/253c898b5d00fd059181fd8c1b12086ffac5ffe3" alt=""
...
{
int i;
data:image/s3,"s3://crabby-images/f74bf/f74bf4d021fa1e46a95c5e03504faaaf9e596d6a" alt=""
FILE *f;
data:image/s3,"s3://crabby-images/e6f2e/e6f2e8325d37022fc941e6ab82fefb682b1fc8f4" alt=""
if(!(f=fopen(filename,"r")))...{
printf("Fail to open source file %s! ",filename);
exit(0);
}
int k=0;
char c;
while((c=fgetc(f))!=EOF)
data:image/s3,"s3://crabby-images/541b4/541b4ec9cbcb9e3d6380a1d8420bffacd76726b4" alt=""
...{
input[k]=c;
k++;
}
input[k] = 0;
//打印出程序
printf("%s ",start_of_instr);
data:image/s3,"s3://crabby-images/6a1c9/6a1c985d3d52e2d4aad57708db4eb12709f78ad8" alt=""
//开始语法检查
grammar_check();
data:image/s3,"s3://crabby-images/41102/411021a420d77151de976145f2d838b93d095a9a" alt=""
printf("Success! ");
return 0;
}
data:image/s3,"s3://crabby-images/b1bf4/b1bf4f3448550bfbf40ebbd8daf0b626f74011c6" alt=""
//
词法分析
int
main_spell(
char
*
filename)
data:image/s3,"s3://crabby-images/e1681/e1681a1ccab021fe22542cae0b1f71406ada8871" alt=""
...
{
int i;
data:image/s3,"s3://crabby-images/b1d94/b1d94db3f50de42563031544dd7891c7ac6de8da" alt=""
FILE *f;
data:image/s3,"s3://crabby-images/3ef58/3ef58a0e8785eb202d96925ea0fbe3eeb4cdfa04" alt=""
if(!(f=fopen(filename,"r")))...{
printf("Fail to open source file %s! ",filename);
exit(0);
}
data:image/s3,"s3://crabby-images/05a93/05a93c0f543f3458e46b50fbff9f4d4d05914761" alt=""
data:image/s3,"s3://crabby-images/8a226/8a22648a13c68e60314b67c373e165b292aa6334" alt=""
int k=0;
char c;
while((c=fgetc(f))!=EOF)
data:image/s3,"s3://crabby-images/c02b0/c02b0493f7ba3c278d95f02c95e89d1808cd1607" alt=""
...{
input[k]=c;
k++;
}
data:image/s3,"s3://crabby-images/db3bc/db3bc496a78b876fe50425efc6c0e1d8c811d344" alt=""
input[k] = 0;
data:image/s3,"s3://crabby-images/c5a43/c5a4383c30be499cb9f2809be8933c3b88ec4059" alt=""
printf("%s ",start_of_instr);
data:image/s3,"s3://crabby-images/c5bc1/c5bc161811066d472739a54301116b0719501f87" alt=""
data:image/s3,"s3://crabby-images/898a3/898a3426b3524eab99402b9ddd7284a4f96b3ec2" alt=""
while((i=gettoken())!=END)
data:image/s3,"s3://crabby-images/58e47/58e478df657b8b0748216751fc567a6350e1020f" alt=""
...{
data:image/s3,"s3://crabby-images/25453/25453c531eb25c1b6f044201db0f4a461c35a488" alt=""
if(i == ID)...{
printf("%d %s ",i,string);
continue;
}
data:image/s3,"s3://crabby-images/3bfbf/3bfbf316a5bd72ab90cacd0af554287d421a0e94" alt=""
if(i == NUM)...{
printf("%d %s ",i,string);
continue;
}
data:image/s3,"s3://crabby-images/b4499/b4499ff24a4bf9fdff4c0e1cf078bf2b970d67c2" alt=""
data:image/s3,"s3://crabby-images/0b09a/0b09a221a64aafa2c5047465a2f16b8c62a5873b" alt=""
if(i<20)...{
printf("%d %s ",i,index[i]);
data:image/s3,"s3://crabby-images/95255/95255627a44f901db76d386a0d5fc07adc979586" alt=""
}else...{
printf("%d %c ",i,i);
}
}
data:image/s3,"s3://crabby-images/05532/055321d73e93e748e8e0b5529fad571c14e5e24e" alt=""
return 0;
}
data:image/s3,"s3://crabby-images/dcfae/dcfaece19c309481d918cc49497384cbb880b8e9" alt=""
int
gettoken()
data:image/s3,"s3://crabby-images/9926e/9926ee1fbcad9bf9b6de20e25e0745011d25d92d" alt=""
...
{
int i= (sym = _gettoken());
data:image/s3,"s3://crabby-images/fd162/fd1622f4f3cdcd4c6b0c823eb16ecc1df92bc371" alt=""
#if 0
data:image/s3,"s3://crabby-images/015e4/015e4ac55842ebd083cab2d6ff95a5e7ce838701" alt=""
if(i == ID)...{
printf("%s",string);
}
data:image/s3,"s3://crabby-images/d4cca/d4ccaf78e10e86b7ce349eb312871c0beebde4f2" alt=""
if(i == NUM)...{
printf("%s",string);
}
data:image/s3,"s3://crabby-images/dcf00/dcf00ddc9fba1d9276343bbe7510cf17ca0ccfaf" alt=""
data:image/s3,"s3://crabby-images/53db1/53db15c5c7bc994734217e591e6b6edc9cff3e99" alt=""
if(i<20)...{
printf("%s",index[i]);
data:image/s3,"s3://crabby-images/7436f/7436f910178f09df93a3c259b31033fd0ae02c47" alt=""
}else...{
printf("%c",i);
}
#endif
return sym;
}
data:image/s3,"s3://crabby-images/35af2/35af2cc918d2b2593575f730d1416a41dcffa506" alt=""
data:image/s3,"s3://crabby-images/e23ae/e23aed4b711a76d15e252b27a8ba9ef9f36647d5" alt=""
int
_gettoken()
data:image/s3,"s3://crabby-images/52d65/52d65bc785c562ed623db0330a0f31ffe3995830" alt=""
...
{
char *cp = instr;
data:image/s3,"s3://crabby-images/6dcf6/6dcf662639bfb695609ca1dad861ec47d3725692" alt=""
data:image/s3,"s3://crabby-images/3a496/3a49637aa62e915db85f75cf28d825587304c4d5" alt=""
for(;;)...{
if( *instr == 0)
return END;
data:image/s3,"s3://crabby-images/f924c/f924cf74b1374023c39e8ea2a547c008cdfb556f" alt=""
/**//*
if( 可能读入的字符 > 当前可用缓冲区大小 )
扩展缓冲区
*/
//int,char,if,else,while,do,for
switch ( *instr )
data:image/s3,"s3://crabby-images/a06b8/a06b81738208d8b7b40a73f76549b64a651bcbdf" alt=""
...{
case 'i':
if( instr[1] == 'f' && notda(instr[2]) )
data:image/s3,"s3://crabby-images/4f4c8/4f4c83d67a7c4b69731d8b0e350cad013084d438" alt=""
...{
instr+=2;return IF;
}
if( instr[1] == 'n' && instr[2] == 't' && notda(instr[3]) )
data:image/s3,"s3://crabby-images/1ed3b/1ed3b51fccd71bb7f7bad3326a05d52f5ea7e987" alt=""
...{
instr+=3; return INT;
}
// not a keyword. but an id.
strstart = instr;
instr++;
goto id_label;
case 'c':
if( instr[1] == 'h' && instr[2] == 'a' && instr[3] == 'r' && notda(instr[4]) )
data:image/s3,"s3://crabby-images/fb71d/fb71d37c47f8c9fa186886d1d38b46097939c61b" alt=""
...{instr+=4;return CHAR; }
strstart = instr;
instr++;
goto id_label;
break;
case 'e':
if( instr[1] == 'l' && instr[2] == 's' && instr[3] == 'e' && notda(instr[4]) )
data:image/s3,"s3://crabby-images/b6f7a/b6f7af3f940f28c3700a02c55a1157522799c9da" alt=""
...{instr+=4;return ELSE; }
strstart = instr;
instr++;
goto id_label;
break;
case 'w':
if( instr[1] == 'h' && instr[2] == 'i' && instr[3] == 'l' && instr[4] == 'e' && notda(instr[5]) )
data:image/s3,"s3://crabby-images/b0370/b03707a8cf3a82ff323d103aeb51dac696e55b4f" alt=""
...{instr+=5;return WHILE; }
strstart = instr;
instr++;
goto id_label;
case 'd':
if( instr[1] == 'o' && notda(instr[4]) )
data:image/s3,"s3://crabby-images/f8d5e/f8d5ef8530adaae68fcb0780617412524b34d1e1" alt=""
...{instr+=2;return DO; }
strstart = instr;
instr++;
goto id_label;
case 'f':
if( instr[1] == 'o' && instr[2] == 'r' && notda(instr[3]) )
data:image/s3,"s3://crabby-images/ef6d7/ef6d7806ec4d7ac177696ec215ef0ea214ca082a" alt=""
...{instr+=3;return FOR; }
strstart = instr;
instr++;
goto id_label;
// deal with IDs.
// EXCLUDE:i,c,d,e,w,f
case 'a': ; case 'b': ;
case 'g': ; case 'h': ;
case 'j': ; case 'k': ; case 'l': ;
case 'm': ; case 'n': ; case 'o': ;
case 'p': ; case 'q': ; case 'r': ;
case 's': ; case 't': ; case 'u': ;
case 'v': ; case 'x': ;
case 'y': ; case 'z': ;
case 'A': ; case 'B': ;
case 'C': ; case 'D': ; case 'E': ;
case 'F': ; case 'G': ; case 'H': ;
case 'I': ; case 'J': ; case 'K': ;
case 'L': ; case 'M': ; case 'N': ;
case 'O': ; case 'P': ; case 'Q': ;
case 'R': ; case 'S': ; case 'T': ;
case 'U': ; case 'V': ; case 'W': ;
case 'X': ; case 'Y': ; case 'Z': ;
strstart = instr;
instr++;
goto id_label;
data:image/s3,"s3://crabby-images/b04b8/b04b89678252fde7df740145f4111691e7af0e02" alt=""
case '0': ;
case '1': ; case '2': ; case '3': ;
case '4': ; case '5': ; case '6': ;
case '7': ; case '8': ; case '9': ;
strstart = instr;
instr++;
goto num_label;
data:image/s3,"s3://crabby-images/c5e4a/c5e4abf9e565826608ff0fd0b95f8327580da247" alt=""
case '{':
instr++;
return '{';
case '}':
instr++;
return '}';
case '(':
instr++;
return '(';
case ')':
instr++;
return ')';
case '+':
instr++;
return '+';
case '-':
instr++;
return '-';
case '*':
instr++;
return '*';
case '/':
data:image/s3,"s3://crabby-images/f9b02/f9b02718f7a71b12ab74bf20903230956cd9705b" alt=""
if( instr[1] == '/' )...{ // ‘//’形式的注释
instr += 2;
while( *(instr) != 10 && *(instr) != 0 )
instr ++;
// instr ++;
data:image/s3,"s3://crabby-images/0032e/0032ec63754be02a3ac4ec1ce25443e47053ab59" alt=""
}else...{ // 除号'/'
instr++;
return '/';
}
break;
case '=':
data:image/s3,"s3://crabby-images/b2822/b282295961c2bad9c764f80a524cc53c1838b3bc" alt=""
if( instr[1] == '=') ...{instr+=2; return EQUAL; }
data:image/s3,"s3://crabby-images/003db/003db7ff6d0326bdc733d7271944a475dcc5dcf0" alt=""
else ...{instr++; return '=';}
break;
case '<':
data:image/s3,"s3://crabby-images/492a2/492a21bfa8d4f6b717dc8ef5bedc0ae27b1c0cbb" alt=""
if( instr[1] == '=') ...{instr+=2; return LESSEQUAL; }
data:image/s3,"s3://crabby-images/f83c5/f83c50c7c4d3545802b58a1d327484c31a58ab9a" alt=""
else ...{instr++; return '<';}
break;
case '>':
data:image/s3,"s3://crabby-images/65284/6528483205294b7863d0eb98d021c4b8310970c0" alt=""
if( instr[1] == '=') ...{instr+=2; return GREATEQUAL; }
data:image/s3,"s3://crabby-images/79b88/79b88fd559ed9193e408ebe7573171b192edd9df" alt=""
else ...{instr++; return '>';}
break;
case '!':
data:image/s3,"s3://crabby-images/d7858/d7858135e676c5c7c6f3e1b6db1662494462bef1" alt=""
if( instr[1] == '=') ...{instr+=2; return NOTEQUAL; }
data:image/s3,"s3://crabby-images/39e23/39e231d329328a0f54abcb2cd90525e315f06df0" alt=""
else ...{instr++; return '!';}
break;
data:image/s3,"s3://crabby-images/5a26f/5a26f99db67093d19c8b4c5749f17e1fc88d1151" alt=""
case '&':
data:image/s3,"s3://crabby-images/caf77/caf77bee44fee671bdc01850d7ed47fcd1f0ec48" alt=""
if( instr[1] == '&') ...{instr+=2; return ARGAND; }
data:image/s3,"s3://crabby-images/0000b/0000b14ed9e46519efa789dd6b92353888bd6ce8" alt=""
if( instr[1] == '&' && (isid(instr[2]) || isspace(instr[2])) )...{ instr++; return '&'; }
error(instr);
break;
data:image/s3,"s3://crabby-images/d7ca8/d7ca8866c496cad55513725cb594ac4554d48fb7" alt=""
case '|':
data:image/s3,"s3://crabby-images/5cbcd/5cbcdb4e30a77c051a9c8d7fe97be3891cb16951" alt=""
if( instr[1] == '|') ...{instr+=2; return ARGAND; }
data:image/s3,"s3://crabby-images/a0503/a0503de707094d17d251958b0ec6494e18ef6c56" alt=""
if( instr[1] == '|' && (isid(instr[2]) || isspace(instr[2])) )...{ instr++; return '|'; }
error(instr);
break;
data:image/s3,"s3://crabby-images/8fca5/8fca575e435de088420b8727819a85f1cdbdd799" alt=""
case ';':
instr++;
return ';';
case ' ':
//printf("new line (%d) ",getline());
nextline();
instr++;
start_pos_of_current_line = (int)instr;
break;
default:
instr++;
break;
id_label:
while( isid(*instr) )
instr++;
strncpy(string,strstart,instr-strstart);
string[instr-strstart]=0;
return ID;
num_label:
while( isdigit(*instr) )
instr++;
data:image/s3,"s3://crabby-images/d43fb/d43fb91303c00c15e21de1fe1c1518204d9eeb62" alt=""
// if(isalpha(*(instr+1))
// error(instr); 让语法分析来做吧~
data:image/s3,"s3://crabby-images/ed3ad/ed3ad86d000894e799b952b908b2fc1e8451b17f" alt=""
strncpy(string,strstart,instr-strstart);
string[instr-strstart]=0;
return NUM;
}
data:image/s3,"s3://crabby-images/f22bd/f22bd35c5c4e8a107dd5398c30681fa50c0faa44" alt=""
data:image/s3,"s3://crabby-images/06a95/06a952559800911bb209593830b0e6370c77630b" alt=""
data:image/s3,"s3://crabby-images/8ba57/8ba57281f36e4c7a87ba7866ec9dc15a51e21f46" alt=""
}
}
data:image/s3,"s3://crabby-images/095d4/095d47601eb203930d279f6145b691ebd765ba56" alt=""
data:image/s3,"s3://crabby-images/4e16d/4e16d0e1920906592321240f362cc12be5664ed5" alt=""
int
main(
int
argc,
char
*
argv[])
data:image/s3,"s3://crabby-images/3a828/3a8281f94a1ea7975cae677385dc5369ebba17bb" alt=""
...
{
data:image/s3,"s3://crabby-images/21f4d/21f4dc2e4b8df6a7c57a54451a3230271876a428" alt=""
if(argc <= 1 || argc >=4) ...{
printf("Usage:>LexAly [g|s] [filename] ");
exit(0);
}
data:image/s3,"s3://crabby-images/f5278/f527831cd414303e7395e67ae7c2ac9d78e7ea87" alt=""
data:image/s3,"s3://crabby-images/90d22/90d22a30f859b800c26716253c87e74f1149bc22" alt=""
if(argc == 3 )...{
argv[1][0] == 'g'? main_grammar(argv[2]): main_spell(argv[2]);
data:image/s3,"s3://crabby-images/28dcb/28dcb56178d95372e0d92520b58926ef59edbcac" alt=""
}else if(argc == 2)...{
argv[1][0] == 'g'? main_grammar("source2.txt") : main_spell("source2.txt");
;
}
return 0;
}
//
grammar.cpp :C子集语法分析程序
data:image/s3,"s3://crabby-images/9b09b/9b09bab999763befc30800b23489379feba498de" alt=""
/**/
/*
C语言子集,可支持
语句块,语句,条件语句,While循环语句,赋值语句,基本算术表达式等。例如:
{
// Comment Supported : This is only a Test ^_^
data:image/s3,"s3://crabby-images/70938/7093892aadb7ea61436a32fa16f0e87db6d19483" alt=""
X = 12 + b / 13 - 5 * 4 * 9; // A AssignmentStatement
Y = 4 * 1024;
data:image/s3,"s3://crabby-images/e037d/e037d27b773ae521d06c9b617ba8365f41549132" alt=""
if( X >= Y){
if( i == i){ // This is nested if Statement
X=Y;
}
}
data:image/s3,"s3://crabby-images/5c5b9/5c5b9b0d0ec1e528bd9dc5b2062041f1ae178ba3" alt=""
;;;; // This is Null Statement
data:image/s3,"s3://crabby-images/fef0f/fef0fa066bcb899ff9d2f56088fdba2b16e38de1" alt=""
while( X < Y){ // This is while Statement
X = X +1;
}
}
data:image/s3,"s3://crabby-images/1e480/1e4803307d97f0af7a5b0890c82bb24796912649" alt=""
规则如下:
data:image/s3,"s3://crabby-images/31e27/31e275468be5644fc3a79a1bc0fac225ff460b0f" alt=""
<StatementBlock> ::= '{'<StatementSequence>'}'
<StatementSequence> ::= {<NullStatement>|<CommonStatement>|<VariantStatement>}
data:image/s3,"s3://crabby-images/20481/204816933ec9f110ef290237a45a369fa717ec16" alt=""
<NullStatement> ::= ';'
<CommonStatement> ::= <AssignmentStatement>
<VariantStatement> ::= <ConditionStatement>| <LoopWhileStatement>
data:image/s3,"s3://crabby-images/adf44/adf449476c39af68bfc9a3d6e9735dae7e8adf3c" alt=""
<AssignmentStatement> ::= ID=<Expression>
<ConditionStatement> ::= if(<Condition> <StatementBlock>
<LoopWhileStatement> ::= while(<Condition> <StatementBlock>
data:image/s3,"s3://crabby-images/56620/56620a00320571f3e2a613fa731ab7176e7b8cda" alt=""
<Condition> ::= <Expression><RelationOperator><Expression>
<Expression> ::= <Item>{+<Item>|-<Item>}
<Item> ::= <Factor>{*<Factor>|/<Factor>}
<Factor> ::= ID|NUM|(<Expression>)
<RelationOperator> ::= <|<=|>=|>|==|!=
data:image/s3,"s3://crabby-images/4ef52/4ef5271d660bb51bfa7a1df6c132d35810effc47" alt=""
*/
data:image/s3,"s3://crabby-images/fdcbd/fdcbd5ae2721285af6fcd42c9fb14f687ef896df" alt=""
data:image/s3,"s3://crabby-images/a9656/a96566849151b756340abfdd9d880a9b8ce90dd7" alt=""
data:image/s3,"s3://crabby-images/bcbb1/bcbb145573ea41a6c4f53f765a773edd24489909" alt=""
#include
"
stdafx.h
"
#include
<
ctype.h
>
#include
<
conio.h
>
#include
<
stdlib.h
>
#include
<
string.h
>
data:image/s3,"s3://crabby-images/33918/33918b5f597e4379df868192991d2bb41395bbdb" alt=""
#include
"
Constant.h
"
data:image/s3,"s3://crabby-images/64b3d/64b3dda087f432524a3b84646e8974c1cbacf160" alt=""
extern
int
gettoken();
extern
int
getcurrentpos();
extern
char
*
string;
extern
int
sym;
extern
int
current_line;
extern
int
start_pos_of_current_line;
extern
char
*
getlinestring(
int
line,
char
*
in_buf);
extern
char
input[];
data:image/s3,"s3://crabby-images/85d49/85d497c5870ac73d076da9e321e9111c01261445" alt=""
//
非终结符的英文定义
void
StatementBlock();
//
语句块
void
StatementSequence();
//
语句串
data:image/s3,"s3://crabby-images/4c7b9/4c7b988b816e1e20f5532cc4cd016e46dcc999e0" alt=""
//
XxxxxStatement() 为三类语句
void
NullStatement();
//
空语句--仅仅含有一个;号
void
CommonStatement();
//
语句
void
VariantStatement();
//
变种语句--包括 if(){},while{},他们都不以;结尾
data:image/s3,"s3://crabby-images/075de/075de6d99b6b5d8414e3def437955b6733a1ca7b" alt=""
//
下面的属于CommonStatement
void
AssignmentStatement();
//
赋值语句
data:image/s3,"s3://crabby-images/57685/57685e8aa236fd22715ef6d5bd60fd4c96f68acd" alt=""
//
下面两种属于VariantStatement
void
ConditionStatement();
//
条件语句
void
LoopWhileStatement();
//
while循环语句
void
Condition();
//
条件
void
Expression();
//
表达式
void
Item();
//
项
void
Factor();
//
因子
void
RelationOperator();
//
关系运算符
data:image/s3,"s3://crabby-images/9c124/9c124df70339f6c98e1c6e5d6bf9876f55f5de96" alt=""
/**/
/*
注:以上未考虑函数调用表达式
*/
data:image/s3,"s3://crabby-images/339b0/339b08bf37d074614f82845b4114c9fc52d43a3b" alt=""
data:image/s3,"s3://crabby-images/05d34/05d3405049e69f95e1b31b56609fe7b045bdf0bc" alt=""
void
match_error(
char
*
c)
data:image/s3,"s3://crabby-images/40125/401254879378e1f6943fe27836d9d38ec9c2ac3b" alt=""
...
{
char error_buf[1024];
int in_line_pos = getcurrentpos()-start_pos_of_current_line;
data:image/s3,"s3://crabby-images/a3908/a3908896c9bf3d28acb304abd3b7d7b78c08c7a0" alt=""
printf("Grammar Error! ");
printf("Line %d[%d] : %s expected ",current_line,in_line_pos,c);
//获取错误行并打印出来
getlinestring(current_line,error_buf);
printf("%s ",error_buf);
//输出错误指示点(Not Exact!)
for(int i=1; i< in_line_pos; i++)
printf("%c",'^');
printf(" ");
data:image/s3,"s3://crabby-images/8f174/8f17408760a348a7c1f3b8b6095d4eb4b37ff76e" alt=""
exit(0);
}
data:image/s3,"s3://crabby-images/c5003/c5003897d8a501472fc14640204b5a848b5e3e32" alt=""
//
expecetedSym 期望符号
//
msg 出错时给出的消息
void
match(
int
expecetedSym,
char
*
msg)
data:image/s3,"s3://crabby-images/40dc7/40dc7e4732f4a4213d9ab180de63375e3d931b28" alt=""
...
{
data:image/s3,"s3://crabby-images/18975/189751488e0f2cf1ed46045e74dadb35623ac6cd" alt=""
if(expecetedSym != sym)...{
#if 0
if(sym < 0x20 )
printf(" Fail: ExpecetedSym=%d sym=%d ",expecetedSym,sym);
else
printf(" Fail: ExpecetedSym=%d sym=%c ",expecetedSym,sym);
#endif
match_error(msg);
}
gettoken(); //预读一个符号
data:image/s3,"s3://crabby-images/70181/70181dbd472e9b34e30f05266866ce9131520c77" alt=""
}
void
grammar_check()
data:image/s3,"s3://crabby-images/f0b0a/f0b0a900257dcffdb18fc630ef7f2b38b626c94e" alt=""
...
{
data:image/s3,"s3://crabby-images/ef1df/ef1df5700a47e1fd0d1e59d8a99db0355fd619bf" alt=""
// printf("%s",input);
gettoken(); //开始检查,填充预读区
// match('-',"DK");
StatementBlock();
if(sym != END) match(END,"End Of File");
}
data:image/s3,"s3://crabby-images/91418/91418ae56d0f47d4662b280c3f79375a2d43202a" alt=""
void
StatementBlock()
//
语句块
data:image/s3,"s3://crabby-images/36249/362498848d15016b4352f2b4a960b6edfe21869e" alt=""
...
{
match('{',"{"); //和预读符号比较
StatementSequence();
match('}',"}");
}
data:image/s3,"s3://crabby-images/919a0/919a059f02d33856e7b6bf4f8e98d99c9e81b35a" alt=""
void
StatementSequence()
//
语句串
data:image/s3,"s3://crabby-images/a8304/a8304666ef5041fc958904983bf14181bdfc0c7d" alt=""
...
{
data:image/s3,"s3://crabby-images/adcef/adcefd7dd1833315f7da83fe1d172d1895d0f2f6" alt=""
while(sym == ID ||
sym == IF ||
sym == WHILE||
sym == ';')
data:image/s3,"s3://crabby-images/f6b72/f6b723d7d19d97451e0377d557e864208521ef9c" alt=""
...{
while(sym == ID) //也可以用if(),但从统计角度看,while效率会略高。
//因为一般普通CommonStatement()出现概率较大
data:image/s3,"s3://crabby-images/758f5/758f510e4e31d6fcdee7e3699583a5ce2f95178b" alt=""
...{
CommonStatement();
match(';',";");
}
while(sym == IF ||
sym == WHILE)
data:image/s3,"s3://crabby-images/fdf19/fdf19cbe7b5e2dc18b7bcab8552ad80244fc72e8" alt=""
...{
VariantStatement();
}
while(sym == ';')
data:image/s3,"s3://crabby-images/fd441/fd441e0b9a0663c8ed82d1e8c0c4edfb0afc3bc4" alt=""
...{
NullStatement();
}
}
}
data:image/s3,"s3://crabby-images/f448f/f448fdb42aca1061cbea951a1308cc2964b35b91" alt=""
void
VariantStatement()
//
变种语句--包括 if(){},while{},他们都不以;结尾
data:image/s3,"s3://crabby-images/675dc/675dc1784615b6dc060151a062e76296ee67c4e0" alt=""
...
{
data:image/s3,"s3://crabby-images/32b79/32b799ad54a8f3f4bb9f0727fab4975729d12ec1" alt=""
switch(sym)...{ //若sym与下面两种均不匹配,什么也不做,空语句是也~
case IF:
ConditionStatement(); //条件语句
break;
case WHILE:
LoopWhileStatement();
break;
}
return;
}
data:image/s3,"s3://crabby-images/91095/910950bb3ee145db557cb3c540d33ebe54ade3de" alt=""
void
NullStatement()
//
空语句--仅仅含有一个;号
data:image/s3,"s3://crabby-images/808f5/808f535b36add4707f1f0c73f5a514b51522c947" alt=""
...
{
match(';',";");
}
data:image/s3,"s3://crabby-images/7eeac/7eeac675cf62d17c3d2cb1f1974f11ce36377484" alt=""
void
CommonStatement()
//
语句,以;结尾,但不以;开头
data:image/s3,"s3://crabby-images/23481/23481312eebaf7937174476ed1ab4db10487d15b" alt=""
...
{
data:image/s3,"s3://crabby-images/dd1bb/dd1bb980e2d60c2eb0d642e50aa9c091f8677280" alt=""
switch(sym)...{ //若sym与下面任何一种均不匹配,什么也不做,空语句是也~
case ID:
AssignmentStatement();
break;
}
return;
}
data:image/s3,"s3://crabby-images/19222/19222ee9fa23e4865d28cb37a19469cfcd5c13c9" alt=""
void
AssignmentStatement()
//
赋值语句
data:image/s3,"s3://crabby-images/554dc/554dc04aab8ce0396c88e09b7f177700a0d900e5" alt=""
...
{
match(ID,"ID");
match('=',"=");
Expression();
}
data:image/s3,"s3://crabby-images/0af6e/0af6ee35409ac95f1e42822918edf642c8c7c5b5" alt=""
void
ConditionStatement()
//
条件语句
data:image/s3,"s3://crabby-images/06264/062644a4244fe7fcd433301334f16a47d6dcb4b6" alt=""
...
{
match(IF,"if");
match('(',"(");
Condition();
match(')',")");
StatementBlock();
}
data:image/s3,"s3://crabby-images/37b37/37b37054687b22162fb19d7e904206b695fe0320" alt=""
void
LoopWhileStatement()
//
循环语句
data:image/s3,"s3://crabby-images/e19a7/e19a7f7a853d1265049a77d7add41a5bc6dd7cbc" alt=""
...
{
match(WHILE,"while");
match('(',"(");
Condition();
match(')',")");
StatementBlock();
}
data:image/s3,"s3://crabby-images/dfe93/dfe931c7c2afa67e7bd72c10108ad96463c8b8b0" alt=""
void
Condition()
//
条件
data:image/s3,"s3://crabby-images/002cb/002cb43c8e2f9149fea78dfd77c6cd706f7de2ed" alt=""
...
{
Expression();
RelationOperator();
Expression();
}
data:image/s3,"s3://crabby-images/b9a60/b9a60f70546c3f56dd7713d46f6455acb8e887ac" alt=""
//
<Expression> ::= <Item>{+<Item>|-<Item>}
void
Expression()
//
表达式
data:image/s3,"s3://crabby-images/7e15b/7e15b018983945142a5d917023fc456f65cd82bf" alt=""
...
{
Item();
data:image/s3,"s3://crabby-images/38fae/38faeb396fa566c04cb26d4b1b8cdb8a87a48f6e" alt=""
while(true)...{ // {+<Item>|-<Item>} 可以有多个
data:image/s3,"s3://crabby-images/944af/944af8d6ac7991198dc782f0018b900016bbc533" alt=""
switch(sym)...{
case '+':
match('+',"+");
Item();
break;
case '-':
match('-',"-");
Item();
break;
default:
return;
}
}
return;
data:image/s3,"s3://crabby-images/3869d/3869decfde96dc3416b67bfad5bdcd58727b3edc" alt=""
}
//
<Item> ::= <Factor>{*<Factor>|/<Factor>}
void
Item()
//
项
data:image/s3,"s3://crabby-images/5ee8d/5ee8df322410ceb16965d748f0f92bad000fc2e1" alt=""
...
{
Factor();
data:image/s3,"s3://crabby-images/6c310/6c310837c0add60776996970b2046935108af63f" alt=""
while(true)...{ // {*<Factor>|/<Factor>} -- 可以有多个
data:image/s3,"s3://crabby-images/217c1/217c1057f0ee7871bc293041340a2b58b48379d1" alt=""
switch(sym)...{
case '*':
match('*',"*");
Factor();
break;
case '/':
match('/',"/");
Factor();
break;
default:
return;
}
}
return;
}
//
<Factor> ::= ID|NUM|(<Expression>)
void
Factor()
//
因子
data:image/s3,"s3://crabby-images/c1768/c17683430d1171906a543771e0c8dbcc1580eb84" alt=""
...
{
data:image/s3,"s3://crabby-images/afd55/afd55b8c5d01a2b81e4c69692e9e9b4583924eab" alt=""
switch(sym)...{
case ID:
match(ID,"ID");
break;
case NUM:
match(NUM,"NUM");
break;
case '(':
match('(',"(");
Expression();
match(')',")");
break;
default:
match(ID,"A factor "); // ID在这里肯定不match,利用它来报错(找不到因子)
break;
}
}
//
<RelationOperator> ::= <|<=|>=|>|==|!=
void
RelationOperator()
//
关系运算符
data:image/s3,"s3://crabby-images/27af0/27af0bdef91990a2e3020312a1d07fa8da065420" alt=""
...
{
data:image/s3,"s3://crabby-images/138d6/138d6d31de49bb37d29a3c921fc83dd73121b7cc" alt=""
switch(sym)...{
case '<':
match('<',"<");
break;
case '>':
match('>',">");
break;
case LESSEQUAL:
match(LESSEQUAL,"<=");
break;
case GREATEQUAL:
match(GREATEQUAL,">=");
break;
case EQUAL:
match(EQUAL,"==");
break;
case NOTEQUAL:
match(NOTEQUAL,"!=");
break;
}
}
核心:规则----
<StatementBlock> ::= '{'<StatementSequence>'}'
<StatementSequence> ::= {<NullStatement>|<CommonStatement>|<VariantStatement>}
<NullStatement> ::= ';'
<CommonStatement> ::= <AssignmentStatement>
<VariantStatement> ::= <ConditionStatement>| <LoopWhileStatement>
<AssignmentStatement> ::= ID=<Expression>
<ConditionStatement> ::= if(<Condition> <StatementBlock>
<LoopWhileStatement> ::= while(<Condition> <StatementBlock>
<Condition> ::= <Expression><RelationOperator><Expression>
<Expression> ::= <Item>{+<Item>|-<Item>}
<Item> ::= <Factor>{*<Factor>|/<Factor>}
<Factor> ::= ID|NUM|(<Expression>)
<RelationOperator> ::= <|<=|>=|>|==|!=