diff --git a/lexical_analysis.cpp b/lexical_analysis.cpp index 7cfbcf4..b92a3a8 100644 --- a/lexical_analysis.cpp +++ b/lexical_analysis.cpp @@ -2,13 +2,14 @@ #include #include -#define SELFDEFINE -1 //自定义标识符 -#define IDENTIFIER -2 //界符 or 运算符 -#define NUMBER -3 //数字 -#define RESERVEWORD -4//关键字 -#define FAIL -5 //失败 -#define SCANEND -6 //扫描完成 -#define ERRORFOUND -7 //异常错误 +#define IDENTIFIER -1 //自定义标识符 +#define OPERATOR -2 //界符 or 运算符 +#define NUMBER -3 //数字 +#define RESERVEWORD -4 //关键字 +#define STRING -5 //字符串类型 +#define FAIL -6 //失败 +#define SCANEND -7 //扫描完成 +#define ERRORFOUND -8 //异常错误 // \n 换行 // \t tab @@ -16,13 +17,13 @@ // \\ 反斜线 // \' 单引号 // \" 双引号 -std::string ReserveWord[27]= +std::string ReserveWord[26]= { "for","foreach","forindex","while", "var","func","break","continue","return", "if","else","elsif","nil","and","or", "print","cmp","append","setsize","subvec","pop", - "sort","contains","delete","keys","typeof","id" + "sort","contains","delete","keys","typeof" }; std::string OperatorOrDelimiter[40]= @@ -35,11 +36,11 @@ std::string OperatorOrDelimiter[40]= }; std::string IdentifierTable[1000]={""}; -char ResourcePrograme[16384]; +char ResourcePrograme[16777216]; int isReserveWord(std::string &p) { - for(int i=0;i<27;++i) + for(int i=0;i<26;++i) if(ReserveWord[i]==p) return i+1; return FAIL; @@ -55,12 +56,12 @@ int isOperatorOrDelimiter(std::string &p) bool isLetter(char t) { - return ('a'<=t && t<='z' || 'A'<=t && t<='Z'); + return (('a'<=t) && (t<='z') || ('A'<=t) && (t<='Z')); } bool isNumber(char t) { - return ('0'<=t && t<='9'); + return (('0'<=t) && (t<='9')); } void InputFile(std::string &FileName) @@ -122,7 +123,7 @@ void Scanner(int &Syn,const char Source[],std::string &token,int &ptr) } Syn=isReserveWord(token); if(Syn==FAIL) - Syn=SELFDEFINE; + Syn=IDENTIFIER; else Syn=RESERVEWORD; } @@ -145,17 +146,17 @@ void Scanner(int &Syn,const char Source[],std::string &token,int &ptr) Syn=NUMBER; } else if(temp=='(' || temp==')' || temp=='[' || temp==']' || temp=='{' || - temp=='}' || temp==',' || temp==';' || temp=='\"' || temp==':' || - temp=='?' || temp=='.' || temp=='`' || temp=='\'' || temp=='&' || - temp=='|') + temp=='}' || temp==',' || temp==';' || temp=='|' || temp==':' || + temp=='?' || temp=='.' || temp=='`' || temp=='\'' || temp=='&'|| + temp=='%' || temp=='$' || temp=='^') { token+=temp; ++ptr; - Syn=IDENTIFIER; + Syn=OPERATOR; } else if(temp=='=' || temp=='+' || temp=='-' || temp=='*' || temp=='!' || temp=='/' || temp=='<' || temp=='>' || temp=='~') { - Syn=IDENTIFIER; + Syn=OPERATOR; token+=temp; ++ptr; temp=Source[ptr]; @@ -167,13 +168,7 @@ void Scanner(int &Syn,const char Source[],std::string &token,int &ptr) } else if(temp=='\\') { - /* - "+","-","*","/","=","+=","-=","*=","/=", - "\n","\t","\r","\\","\'","\"",".", - "<","<=",">",">=","==","!=","!","~", - ",",";","(",")","[","]","{","}","#" - */ - Syn=IDENTIFIER; + Syn=OPERATOR; token+=temp; ++ptr; temp=Source[ptr]; @@ -183,6 +178,43 @@ void Scanner(int &Syn,const char Source[],std::string &token,int &ptr) ++ptr; } } + else if(temp=='\"') + { + Syn=STRING; + token+=temp; + ++ptr; + temp=Source[ptr]; + while(temp!='\"') + { + if(temp=='\\') + { + token+=temp; + + ++ptr; + temp=Source[ptr]; + token+=temp; + + ++ptr; + temp=Source[ptr]; + } + else + { + token+=temp; + ++ptr; + temp=Source[ptr]; + } + if(temp=='@' || temp=='\n') + break; + } + //add the last char \" + if(temp=='\"') + { + token+=temp; + ++ptr; + } + else + token+=" __missing_end_of_string"; + } else if(temp=='@') { Syn=SCANEND; @@ -192,10 +224,10 @@ void Scanner(int &Syn,const char Source[],std::string &token,int &ptr) { Syn=FAIL; std::cout<<"[Error] Unexpected error occurred: "<> Complete scanning \""<