#include "stdafx.h"
#include <limits.h>
enum WORD_TYPE_ENUM{// word (token) type enumeration values
INVALID_WORD,// default type of every character that has no entry in the single-character table
IDENTIFIER,// a name that is not in the reserved-word table
NUMBER,// a run of decimal digits
CONST,// reserved word "const"
VAR,// reserved word "var"
PROCEDURE,// reserved word "procedure"
BEGIN,// reserved word "begin"
END,// reserved word "end"
IF,// reserved word "if"
THEN,// reserved word "then"
WHILE,// reserved word "while"
DO,// reserved word "do"
WRITE,// reserved word "write"
READ,// reserved word "read"
CALL,// reserved word "call"
LEFT_PARENTHESIS,// "("
RIGHT_PARENTHESIS,// ")"
COMMA,// ","
SEMICOLON,// ";"
PERIOD,// "."
PLUS,// "+"
MINUS,// "-"
MULTIPLY,// "*"
DIVIDE,// "/"
ODD,// reserved word "odd"
EQL,// "="
NEQ,// "#"
LES,// "<"
LEQ,// "<="
GTR,// ">"
GEQ,// ">="
ASSIGN,// ":="
ZIZENG,// "++" (increment)
ZIJIAN,// "--" (decrement)
EQLS,// "=="
};
// One entry of the reserved-word table: pairs the spelling of a reserved word
// with the word type that the lexer assigns to it.
struct RESERVED_WORD_NAME_VS_TYPE_STRUCT{
char szName[20];// spelling of the reserved word (NUL-terminated string)
enum WORD_TYPE_ENUM eType;// word type enumeration value of the reserved word
};
#define MAX_LENGTH_OF_A_WORD 10 // maximum number of characters kept for one word
#define MAX_NUMBER_OF_WORDS 1000 // maximum number of words that can be recognized
#define NUMBER_OF_RESERVED_WORDS 13 // number of reserved words
// Data recorded for one recognized word.
struct WORD_STRUCT{
// Spelling of the word. GetAWord collects up to MAX_LENGTH_OF_A_WORD
// characters and then copies them here as a NUL-terminated string, so the
// buffer needs one extra byte for the terminator.
char szName[MAX_LENGTH_OF_A_WORD+1];
enum WORD_TYPE_ENUM eType;// word type enumeration value
int nNumberValue;// numeric value, meaningful when the word is a NUMBER
int nLineNo;// line of the source file on which the word was found
};
RESERVED_WORD_NAME_VS_TYPE_STRUCT ReservedWordNameVsTypeTable[NUMBER_OF_RESERVED_WORDS];// lookup table: reserved-word spelling -> word type
WORD_TYPE_ENUM SingleCharacterWordTypeTable[256];// lookup table: character code -> word type of that single-character word
WORD_STRUCT g_Words[MAX_NUMBER_OF_WORDS];// queue of the words recognized so far
int g_nWordsIndex;// number of words recognized so far (also the index of the next free slot in g_Words)
int g_nLineNo=1;// current line number in the source file
extern FILE *fpSourceFile;// file pointer of the source program file (defined elsewhere)
int WordTypeToString(char string[100],WORD_TYPE_ENUM eWordType);
void PrintInLexis(int nWordsIndex);
int GetAWord();
void InitializeReservedWordTable()//設定保留字單詞的名字字串和相應型別的對照表
{
strcpy(ReservedWordNameVsTypeTable[0].szName,"begin"); ReservedWordNameVsTypeTable[0].eType=BEGIN;
strcpy(ReservedWordNameVsTypeTable[1].szName,"call"); ReservedWordNameVsTypeTable[1].eType=CALL;
strcpy(ReservedWordNameVsTypeTable[2].szName,"const"); ReservedWordNameVsTypeTable[2].eType=CONST;
strcpy(ReservedWordNameVsTypeTable[3].szName,"do"); ReservedWordNameVsTypeTable[3].eType=DO;
strcpy(ReservedWordNameVsTypeTable[4].szName,"end"); ReservedWordNameVsTypeTable[4].eType=END;
strcpy(ReservedWordNameVsTypeTable[5].szName,"if"); ReservedWordNameVsTypeTable[5].eType=IF;
strcpy(ReservedWordNameVsTypeTable[6].szName,"odd"); ReservedWordNameVsTypeTable[6].eType=ODD;
strcpy(ReservedWordNameVsTypeTable[7].szName,"procedure");ReservedWordNameVsTypeTable[7].eType=PROCEDURE;
strcpy(ReservedWordNameVsTypeTable[8].szName,"read"); ReservedWordNameVsTypeTable[8].eType=READ;
strcpy(ReservedWordNameVsTypeTable[9].szName,"then"); ReservedWordNameVsTypeTable[9].eType=THEN;
strcpy(ReservedWordNameVsTypeTable[10].szName,"var"); ReservedWordNameVsTypeTable[10].eType=VAR;
strcpy(ReservedWordNameVsTypeTable[11].szName,"while"); ReservedWordNameVsTypeTable[11].eType=WHILE;
strcpy(ReservedWordNameVsTypeTable[12].szName,"write"); ReservedWordNameVsTypeTable[12].eType=WRITE;
}
void InitializeSingleCharacterTable()//設定單字符單詞的字符和相應型別的對照表
{
int i;
for(i=0;i<=255;i++)
{
SingleCharacterWordTypeTable[i]=INVALID_WORD;
}
SingleCharacterWordTypeTable['+']=PLUS;
SingleCharacterWordTypeTable['-']=MINUS;
SingleCharacterWordTypeTable['*']=MULTIPLY;
SingleCharacterWordTypeTable['/']=DIVIDE;
SingleCharacterWordTypeTable['(']=LEFT_PARENTHESIS;
SingleCharacterWordTypeTable[')']=RIGHT_PARENTHESIS;
// SingleCharacterWordTypeTable['=']=EQL;
//表示相等關系的單詞“=”改為“= =”
SingleCharacterWordTypeTable[',']=COMMA;
SingleCharacterWordTypeTable['.']=PERIOD;
SingleCharacterWordTypeTable['#']=NEQ;
SingleCharacterWordTypeTable[';']=SEMICOLON;
// SingleCharacterWordTypeTable['++']=ZIZENG; //自增@@@
// SingleCharacterWordTypeTable['--']=ZIJIAN; //自減@@@
}
// Lexical analysis driver: initializes both lookup tables, rewinds the source
// file, then repeatedly calls GetAWord and prints every word it recognizes
// until GetAWord stops returning OK.
// If the source file is not open or cannot be rewound, the word list is left
// empty, a message is written to stderr and nothing is analyzed.
void LexicalAnalysis()
{
    int nResult;

    InitializeReservedWordTable();// reserved-word spelling -> word type table
    InitializeSingleCharacterTable();// single character -> word type table
    g_nWordsIndex=0;// no words recognized yet

    // Start reading from the beginning of the source program file.
    if(fpSourceFile==NULL || fseek(fpSourceFile, 0L, SEEK_SET)!=0)
    {
        fprintf(stderr,"Lexical analysis aborted: cannot rewind the source file.\n");
        return;
    }

    printf("\n----------------Lexical Analysis Begin!--------------\n");
    for(nResult=GetAWord();nResult==OK && g_nWordsIndex>=1;nResult=GetAWord())
        PrintInLexis(g_nWordsIndex-1);// print the word that was just recognized
    printf("----------------Lexical Analysis Finished!--------------\n");
}
// Reads the next character from fpSourceFile and returns it.
// Returns EOF (converted to char) when nothing more can be read.
// Each time the character equals RETURN, g_nLineNo is incremented.
char GetACharacterFromFile()
{
    int nRead=fgetc(fpSourceFile);
    char chRead=(nRead==EOF)?(char)EOF:(char)nRead;

    if(chRead==RETURN)
        g_nLineNo++;// one more source line has been passed
    return chRead;
}
int GetAWord()//詞法分析,獲取一個單詞
{
static char cACharacter=SPACE;//當前字符
int nAWordIndex;//單詞陣列下標,表示單詞第幾個字符
int nDigitNumber;//數單詞的字符個數
int i;
char szAWord[MAX_LENGTH_OF_A_WORD+1];
int nNumberValue; //數的值
//忽略空格、換行和TAB
while((cACharacter==SPACE || cACharacter==RETURN || cACharacter==TABLE) && cACharacter!=EOF)
cACharacter=GetACharacterFromFile();//從檔案中讀取一個字符然后回傳
if(cACharacter!=EOF)//如果不是檔案末尾
{
if((cACharacter>='a' && cACharacter<='z')||(cACharacter>='A' && cACharacter<='Z')||(cACharacter=='_'))//如果當前字符是小寫的字母 改成大寫字母????????
{//識別符號或保留字以a..z開頭或A...Z開頭?????
nAWordIndex=0;//單詞的第一個字符
do{
if(nAWordIndex<MAX_LENGTH_OF_A_WORD)
szAWord[nAWordIndex++]=cACharacter;//把當前字符放進單詞陣列里,單詞陣列下標加一
cACharacter=GetACharacterFromFile();//從檔案中再讀取一個字符
}while((cACharacter>='a' && cACharacter<='z') || (cACharacter>='0' && cACharacter<='9') || (cACharacter>='A' && cACharacter<='Z') || cACharacter=='_' || cACharacter!=EOF);
//只要后面繼續跟a..z或0..9,就要繼續看后面的字符
//當前字符不再是a..z或0..9
if(cACharacter!=EOF)//如果不是檔案末尾
{
szAWord[nAWordIndex]=0;//以0結尾,在單詞陣列中組成一個單詞字串
for(i=0;i<NUMBER_OF_RESERVED_WORDS;i++)//從保留字表中查詢當前單詞字串是否為某一保留字字串
if(strcmp(szAWord,ReservedWordNameVsTypeTable[i].szName)==0)
{
//如果是保留字,則賦當前單詞型別為相應保留字的單詞型別列舉值
g_Words[g_nWordsIndex].eType=ReservedWordNameVsTypeTable[i].eType;
break;
}
if(i>=NUMBER_OF_RESERVED_WORDS)
//如果在保留字表中查詢不出,則當前單詞是識別符號,單詞型別為單詞型別列舉值IDENTIFIER
g_Words[g_nWordsIndex].eType=IDENTIFIER;
strcpy(g_Words[g_nWordsIndex].szName,szAWord);//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
return OK;
}
else
return ERROR;
}
else
//加 if(cACharacter>='0' && cACharacter<='9')
{//數字是以0..9開頭
nDigitNumber=0;//數單詞的字符個數
nNumberValue=https://bbs.csdn.net/topics/0;//數單詞的值
do{
szAWord[nDigitNumber++]=cACharacter;
nNumberValue=https://bbs.csdn.net/topics/10*nNumberValue+cACharacter-'0';//計算數單詞的值
cACharacter=GetACharacterFromFile();//再取下一個字符
}while(cACharacter>='0' && cACharacter<='9' && cACharacter=='_' && cACharacter!=EOF);//如果是0..9,則繼續拼裝數單詞 或以下劃線?????
uj5u.com熱心網友回復:
補充!//加 //如果不是0..9則數單詞結束
if(cACharacter!=EOF)
{
szAWord[nDigitNumber]=0;//以0結尾在單詞陣列中組成一個數單詞字串
g_Words[g_nWordsIndex].eType=NUMBER;//單詞型別為單詞型別列舉值NUMBER
strcpy(g_Words[g_nWordsIndex].szName,szAWord);//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nNumberValue=https://bbs.csdn.net/topics/nNumberValue;//同時將數的值賦給單詞的nNumberValue
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
return OK;
}
else
return ERROR;
}
else
if(cACharacter==':')//當前符號是':'?
{
cACharacter=GetACharacterFromFile();//如果當前符號是':',則要再看下一個符號
if(cACharacter=='=')//如果下一個符號是'='
{//則單詞是賦值符號":="
g_Words[g_nWordsIndex].eType=ASSIGN;//單詞型別為單詞型別列舉值ASSIGN
strcpy(g_Words[g_nWordsIndex].szName,":=");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
return OK;
}
}
else
if(cACharacter=='<')//檢測是"<"還是"<="單詞?
{
cACharacter=GetACharacterFromFile();//再取一個符號
if(cACharacter=='=')
{//單詞是"<="
g_Words[g_nWordsIndex].eType=LEQ;//單詞型別為單詞型別列舉值LEQ
strcpy(g_Words[g_nWordsIndex].szName,"<=");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
return OK;
}
else
{//單詞僅是"<"
g_Words[g_nWordsIndex].eType=LES;//單詞型別為單詞型別列舉值LES
strcpy(g_Words[g_nWordsIndex].szName,"<");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
return OK;
}
}
else
if(cACharacter=='>')//檢測是">"還是">="單詞?
{
cACharacter=GetACharacterFromFile();//再取一個符號
if(cACharacter=='=')
{//單詞是">="
g_Words[g_nWordsIndex].eType=GEQ;//單詞型別為單詞型別列舉值GEQ
strcpy(g_Words[g_nWordsIndex].szName,">=");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
}
else
{//單詞僅是">"
g_Words[g_nWordsIndex].eType=GTR;//單詞型別為單詞型別列舉值GTR
strcpy(g_Words[g_nWordsIndex].szName,">");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;
g_nWordsIndex++;//識別出的單詞個數加一
}
return OK;
}
//將<條件>中的表示相等關系的單詞“=”改為“= =”
else
if(cACharacter=='=')//檢測是"="還是"="單詞?
{
cACharacter=GetACharacterFromFile();//再取一個符號
if(cACharacter=='=')
{//單詞是"="
g_Words[g_nWordsIndex].eType=EQLS;//單詞型別為單詞型別列舉值EQL
strcpy(g_Words[g_nWordsIndex].szName,"==");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
return OK;
}
else
{//單詞僅是"="
g_Words[g_nWordsIndex].eType=EQL;//單詞型別為單詞型別列舉值EQL
strcpy(g_Words[g_nWordsIndex].szName,"=");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
return OK;
}
}
//增加用于識別自增
else
if(cACharacter=='+')//檢測是"++"還是"++"單詞?
{
cACharacter=GetACharacterFromFile();//再取一個符號
if(cACharacter=='+')
{//單詞是"="
g_Words[g_nWordsIndex].eType=ZIZENG;//單詞型別為單詞型別列舉值ZIZENG
strcpy(g_Words[g_nWordsIndex].szName,"++");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
return OK;
}
else
{//單詞僅是"+"
g_Words[g_nWordsIndex].eType=PLUS;//單詞型別為單詞型別列舉值PLUS
strcpy(g_Words[g_nWordsIndex].szName,"+");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
return OK;
}
}
//增加用于識別自減
else
if(cACharacter=='-')//檢測是"-"還是"-"單詞?
{
cACharacter=GetACharacterFromFile();//再取一個符號
if(cACharacter=='-')
{//單詞是"="
g_Words[g_nWordsIndex].eType=ZIJIAN;//單詞型別為單詞型別列舉值ZIJIAN
strcpy(g_Words[g_nWordsIndex].szName,"--");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
return OK;
}
else
{//單詞僅是"-"
g_Words[g_nWordsIndex].eType=MINUS;//單詞型別為單詞型別列舉值MINUS
strcpy(g_Words[g_nWordsIndex].szName,"-");//識別出的單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;//在源代碼檔案中單詞所在的行數
g_nWordsIndex++;//識別出的單詞個數加一
return OK;
}
}
else
{//當不滿足上述條件時,則是單字符 這里的=改為==
//通過查表尋找單字符的單詞型別列舉值
g_Words[g_nWordsIndex].eType=SingleCharacterWordTypeTable[cACharacter];
g_Words[g_nWordsIndex].szName[0]=cACharacter;//單詞放進單詞佇列g_Words中
g_Words[g_nWordsIndex].szName[1]=0;//以0結尾組成一個字串
g_Words[g_nWordsIndex].nLineNo=g_nLineNo;
g_nWordsIndex++;//識別出的單詞個數加一
cACharacter=GetACharacterFromFile();//再取一個符號,為下一步準備
return OK;
}
}
return ERROR;
}
void PrintInLexis(int nIndex)//列印單詞佇列中的一個單詞
{
char szWordName[100];
char szWordType[100];
strcpy(szWordName,g_Words[nIndex].szName);
WordTypeToString(szWordType,g_Words[nIndex].eType);//將單詞型別的列舉值轉換成字串
switch(g_Words[nIndex].eType)
{
case IDENTIFIER:
printf("%-4d%-15s%-20s\n",nIndex,szWordName,szWordType);
break;
case NUMBER:
printf("%-4d%-15s%-20s%-10d\n",nIndex,szWordName,szWordType,g_Words[nIndex].nNumberValue);
break;
case CONST:
case VAR:
case PROCEDURE:
case BEGIN:
case END:
case IF:
case THEN:
case WHILE:
case DO:
case WRITE:
case READ:
case CALL:
case LEFT_PARENTHESIS:
case RIGHT_PARENTHESIS:
case COMMA:
case SEMICOLON:
case PERIOD:
case PLUS:
case MINUS:
case MULTIPLY:
case DIVIDE:
case ODD:
case EQL:
case NEQ:
case LES:
case LEQ:
case GTR:
case GEQ:
case ASSIGN:
case EQLS:
case ZIZENG: //自增!!!!
case ZIJIAN: //自減!!!!
printf("%-4d%-15s%-20s\n",nIndex,szWordName,szWordType);
break;
default:
printf("%-4d%-15s%-20s\n",nIndex,szWordName,szWordType);
}
}
//將單詞型別的列舉值轉換成字串
int WordTypeToString(char strString[100],WORD_TYPE_ENUM eWordType)
{
switch(eWordType)
{
case IDENTIFIER: strcpy(strString,"IDENTIFIER");
break;
case NUMBER: strcpy(strString,"NUMBER");
break;
case PLUS: strcpy(strString,"PLUS");
break;
case MULTIPLY: strcpy(strString,"MULTIPLY");
break;
case MINUS: strcpy(strString,"MINUS");
break;
case DIVIDE: strcpy(strString,"DIVIDE");
break;
case LES: strcpy(strString,"LES");
break;
case LEQ: strcpy(strString,"LEQ");
break;
case GTR: strcpy(strString,"GTR");
break;
case GEQ: strcpy(strString,"GEQ");
break;
case EQL: strcpy(strString,"EQL");
break;
case NEQ: strcpy(strString,"NEQ");
break;
case LEFT_PARENTHESIS: strcpy(strString,"LEFT_PARENTHESIS");
break;
case RIGHT_PARENTHESIS:strcpy(strString,"RIGHT_PARENTHESIS");
break;
case COMMA: strcpy(strString,"COMMA");
break;
case SEMICOLON: strcpy(strString,"SEMICOLON");
break;
case PERIOD: strcpy(strString,"PERIOD");
break;
case ASSIGN: strcpy(strString,"ASSIGN");
break;
case CONST: strcpy(strString,"CONST");
break;
case VAR: strcpy(strString,"VAR");
break;
case PROCEDURE: strcpy(strString,"PROCEDURE");
break;
case BEGIN: strcpy(strString,"BEGIN");
break;
case END: strcpy(strString,"END");
break;
case IF: strcpy(strString,"IF");
break;
case THEN: strcpy(strString,"THEN");
break;
case ODD: strcpy(strString,"ODD");
break;
case WHILE: strcpy(strString,"WHILE");
break;
case DO: strcpy(strString,"DO");
break;
case CALL: strcpy(strString,"CALL");
break;
case READ: strcpy(strString,"READ");
break;
case WRITE: strcpy(strString,"WRITE");
break;
case INVALID_WORD: strcpy(strString,"INVALID_WORD");
break;
}
return NULL;
}
/*
 * 以下為論壇貼文的附帶文字,並非程式的一部分:
 *
 * uj5u.com 熱心網友回復:
 * 大家好,請幫幫忙,有些地方不清楚!需要修改的地方請提示。
 * 轉載請註明出處,本文鏈接:https://www.uj5u.com/houduan/111505.html
 * 標籤:基礎類
 * 上一篇:電腦問題啊
 * 下一篇:請教 LINK : fatal error LNK1104: cannot open file "?.exe" 問題
 */
