Nasal-Interpreter/version0.9/nasal_parser.h

535 lines
12 KiB
C++

#ifndef __NASAL_PARSER_H__
#define __NASAL_PARSER_H__
#include <stack>
#include <string>
// Every symbol the parser can place on its stacks.
// Numbering starts at 1, which leaves 0 free to act as padding inside
// cmp_seq::tokens.
enum token_type
{
    __stack_end = 1,        // bottom-of-stack marker, printed as '#'

    // assignment and comparison
    __equal,                // =
    __cmp_equal,            // ==
    __cmp_not_equal,        // !=
    __cmp_less,             // <
    __cmp_less_or_equal,    // <=
    __cmp_more,             // >
    __cmp_more_or_equal,    // >=

    // logical operators
    __and_operator,         // and
    __or_operator,          // or
    __nor_operator,         // !

    // arithmetic and string-link operators
    __add_operator,         // +
    __sub_operator,         // -
    __mul_operator,         // *
    __div_operator,         // /
    __link_operator,        // ~

    // compound assignment
    __add_equal,            // +=
    __sub_equal,            // -=
    __mul_equal,            // *=
    __div_equal,            // /=
    __link_equal,           // ~=

    // paired delimiters
    __left_brace,           // {
    __right_brace,          // }
    __left_bracket,         // [
    __right_bracket,        // ]
    __left_curve,           // (
    __right_curve,          // )

    // separators
    __semi,                 // ;
    __comma,                // ,
    __colon,                // :
    __dot,                  // .

    // keywords and identifiers
    __var,
    __func,
    __id,
    __return,
    __if,
    __elsif,
    __else,
    __continue,
    __break,
    __for,
    __forindex,
    __foreach,
    __while,

    // values
    __scalar,
    __number,
    __string,
    __char,
    __list,
    __hash,
    __hash_member,

    // grammar-level symbols
    __statement,
    __function,
    __call_function,
    __definition,
    __assignment,
    __calculation,
    __loop,
    __choose,
    __program
};
// Capacity of the pattern array carried by every cmp_seq.
const int max_len=10;

// One reduction rule: a pattern of symbols and the symbol that replaces it.
struct cmp_seq
{
    // Pattern symbols. Entries left out of an initializer are zero, and
    // PDA::reducable() skips zero entries while matching.
    int tokens[max_len];
    // Symbol pushed onto the comp stack once the pattern has matched.
    int res;
};
// Reduction table used by PDA::reducable().
//
// Patterns are written in REVERSE source order. PDA::main_comp_progress()
// shifts symbols so that the earliest symbol of a phrase ends up on top of the
// comp stack, and reducable() matches a pattern starting from its last
// non-zero entry against the stack top. Hence "var id = number ;" is stored as
// { ; number = id var }.
cmp_seq par[]=
{
    // <program> <statement>  ->  <program>
    { {__program,__statement},                  __program    },
    // var id = number ;      ->  <definition>
    { {__semi,__number,__equal,__id,__var},     __definition },
    // <definition>           ->  <statement>
    { {__definition},                           __statement  }
};

// Number of rules in par.
int num_of_par=sizeof(par)/sizeof(par[0]);
// Writes the textual form of a token_type value to std::cout.
// No separator or newline is added; a value that is not listed prints nothing.
void print_token(int type)
{
    struct label
    {
        int type;
        const char* text;
    };
    static const label labels[]=
    {
        {__stack_end,"#"},
        {__equal,"="},
        {__cmp_equal,"=="},
        {__cmp_not_equal,"!="},
        {__cmp_less,"<"},
        {__cmp_less_or_equal,"<="},
        {__cmp_more,">"},
        {__cmp_more_or_equal,">="},
        {__and_operator,"and"},
        {__or_operator,"or"},
        {__nor_operator,"!"},
        {__add_operator,"+"},
        {__sub_operator,"-"},
        {__mul_operator,"*"},
        {__div_operator,"/"},
        {__link_operator,"~"},
        {__add_equal,"+="},
        {__sub_equal,"-="},
        {__mul_equal,"*="},
        {__div_equal,"/="},
        {__link_equal,"~="},
        {__left_brace,"{"},
        {__right_brace,"}"},
        {__left_bracket,"["},
        {__right_bracket,"]"},
        {__left_curve,"("},
        {__right_curve,")"},
        {__semi,";"},
        {__comma,","},
        {__colon,":"},
        {__dot,"."},
        {__var,"var"},
        {__func,"func"},
        {__id,"id"},
        {__number,"number"},
        {__string,"string"},
        {__char,"char"},
        {__continue,"continue"},
        {__break,"break"},
        {__for,"for"},
        {__forindex,"forindex"},
        {__foreach,"foreach"},
        {__while,"while"},
        {__if,"if"},
        {__elsif,"elsif"},
        {__else,"else"},
        {__return,"return"},
        {__scalar,"scalar"},
        {__list,"list"},
        {__hash,"hash"},
        {__hash_member,"hash_member"},
        {__statement,"statement"},
        {__function,"function"},
        {__call_function,"call_func"},
        {__definition,"definition"},
        {__assignment,"assignment"},
        {__calculation,"calc"},
        {__loop,"loop"},
        {__choose,"choose"},
        {__program,"program"}
    };
    const int label_count=sizeof(labels)/sizeof(labels[0]);

    // Stays empty when the value is not in the table.
    std::string context="";
    for(int k=0;k<label_count;++k)
    {
        if(labels[k].type==type)
        {
            context=labels[k].text;
            break;
        }
    }
    std::cout<<context;
    return;
}
// A token reduced to what the parser needs.
struct parse_unit
{
    // Line number copied from the lexer token.
    int line;
    // token_type value assigned to the token.
    int type;
};
// Two-stack shift/reduce recogniser driven by the global table `par`.
//
// main_stack holds the symbols that still have to be read; comp_stack holds
// the symbols read so far, which reducable() rewrites using `par`.
// Both stacks always keep __stack_end at the bottom.
class PDA
{
    private:
        std::stack<int> main_stack;
        std::stack<int> comp_stack;
    public:
        // Installs the sentinels immediately, so every public method is safe
        // to call on a freshly constructed object (std::stack::top() on an
        // empty stack is undefined behaviour).
        PDA()
        {
            set_stack_empty();
        }
        // Resets both stacks to their initial state:
        // main_stack = [#], comp_stack = [#, program].
        void set_stack_empty()
        {
            while(!main_stack.empty())
                main_stack.pop();
            while(!comp_stack.empty())
                comp_stack.pop();
            main_stack.push(__stack_end);
            comp_stack.push(__stack_end);
            comp_stack.push(__program);
        }
        // Resets the automaton, then moves the type of every unit in `temp`
        // onto main_stack. `temp` is left empty. The unit that was on top of
        // `temp` is pushed first, so it is the last one main_stack hands out.
        void stack_input(std::stack<parse_unit>& temp)
        {
            set_stack_empty();
            while(!temp.empty())
            {
                main_stack.push(temp.top().type);
                temp.pop();
            }
            return;
        }
        // Prints the symbols of `temp` from top to bottom, each followed by a
        // single space. A copy is walked, so `temp` itself is not modified.
        void print_stack(std::stack<int>& temp)
        {
            std::stack<int> remaining(temp);
            while(!remaining.empty())
            {
                print_token(remaining.top());
                std::cout<<" ";
                remaining.pop();
            }
            return;
        }
        // Dumps both stacks, one labelled line each.
        void print_main_and_comp()
        {
            std::cout<<">>[Main stack] ";
            print_stack(main_stack);
            std::cout<<std::endl<<">>[Comp stack] ";
            print_stack(comp_stack);
            std::cout<<std::endl;
            return;
        }
        // Tries every rule of `par` in table order against the top of
        // comp_stack. The first rule whose pattern matches is applied: the
        // matched symbols are removed and the rule's result is pushed.
        // Returns true when a reduction happened, false otherwise; on false
        // comp_stack is left exactly as it was.
        bool reducable()
        {
            for(int i=0;i<num_of_par;++i)
            {
                std::stack<int> popped;   // symbols taken off while matching rule i
                bool matched=true;
                bool has_symbol=false;    // an all-zero pattern must never reduce
                // Patterns are stored reversed: the last non-zero entry is
                // compared with the stack top, the first with the deepest one.
                for(int j=max_len-1;j>=0 && matched;--j)
                {
                    const int expected=par[i].tokens[j];
                    if(!expected)
                        continue;         // zero entries are padding
                    if(comp_stack.empty())
                    {
                        matched=false;
                        break;
                    }
                    has_symbol=true;
                    popped.push(comp_stack.top());
                    comp_stack.pop();
                    // A pattern may never swallow the whole stack: something
                    // (at least the bottom sentinel) has to stay underneath.
                    if(popped.top()!=expected || comp_stack.empty())
                        matched=false;
                }
                if(matched && has_symbol)
                {
                    comp_stack.push(par[i].res);
                    return true;
                }
                // Undo the partial match before trying the next rule.
                while(!popped.empty())
                {
                    comp_stack.push(popped.top());
                    popped.pop();
                }
            }
            return false;
        }
        // Runs the recogniser: shifts symbols from main_stack to comp_stack
        // one at a time, reducing as often as possible after each shift, then
        // reports whether comp_stack ended as [#, program].
        // With show==true both stacks are printed after every step.
        void main_comp_progress(bool show)
        {
            if(show)
                print_main_and_comp();
            while(!main_stack.empty() && main_stack.top()!=__stack_end)
            {
                comp_stack.push(main_stack.top());
                main_stack.pop();
                if(show)
                    print_main_and_comp();
                while(reducable())
                {
                    if(show)
                        print_main_and_comp();
                }
            }
            // Accept only when a single __program sits directly on the sentinel.
            bool accepted=false;
            if(!comp_stack.empty() && comp_stack.top()==__program)
            {
                comp_stack.pop();
                accepted=(!comp_stack.empty() && comp_stack.top()==__stack_end);
            }
            if(accepted)
                std::cout<<">>[Parse] 0 error(s)."<<std::endl;
            else
                std::cout<<">>[Parse] Error:"<<std::endl;
            std::cout<<">>[Parse] Complete checking."<<std::endl;
            // Error details are not reported yet.
            return;
        }
};
class nasal_parser
{
private:
std::stack<parse_unit> parser;
public:
void parse_process(std::list<token>& lexer,bool show)
{
while(!parser.empty())
parser.pop();
for(std::list<token>::iterator i=lexer.begin();i!=lexer.end();++i)
{
parse_unit temp_parse;
temp_parse.line=(*i).line;
if(((*i).content=="var") || ((*i).content=="func") || ((*i).content=="return") || ((*i).content=="nil") || ((*i).content=="continue") || ((*i).content=="break") || ((*i).content=="and") || ((*i).content=="or"))
{
if((*i).content=="var")
temp_parse.type=__var;
else if((*i).content=="func")
temp_parse.type=__func;
else if((*i).content=="return")
temp_parse.type=__return;
else if((*i).content=="nil")
temp_parse.type=__number;
else if((*i).content=="continue")
temp_parse.type=__continue;
else if((*i).content=="break")
temp_parse.type=__break;
else if((*i).content=="and")
temp_parse.type=__and_operator;
else if((*i).content=="or")
temp_parse.type=__or_operator;
}
else if((*i).type==IDENTIFIER)
{
temp_parse.type=__id;
}
else if(((*i).content=="for") || ((*i).content=="foreach") || ((*i).content=="while") || ((*i).content=="forindex"))
{
if((*i).content=="for")
temp_parse.type=__for;
else if((*i).content=="forindex")
temp_parse.type=__forindex;
else if((*i).content=="foreach")
temp_parse.type=__foreach;
else if((*i).content=="while")
temp_parse.type=__while;
}
else if(((*i).content=="if") || ((*i).content=="else") || ((*i).content=="elsif"))
{
if((*i).content=="if")
temp_parse.type=__if;
else if((*i).content=="else")
temp_parse.type=__else;
else if((*i).content=="elsif")
temp_parse.type=__elsif;
}
else if(((*i).content=="==") || ((*i).content=="!=") || ((*i).content==">") || ((*i).content==">=") || ((*i).content=="<") || ((*i).content=="<="))
{
if((*i).content=="==")
temp_parse.type=__cmp_equal;
else if((*i).content=="!=")
temp_parse.type=__cmp_not_equal;
else if((*i).content==">")
temp_parse.type=__cmp_more;
else if((*i).content==">=")
temp_parse.type=__cmp_more_or_equal;
else if((*i).content=="<")
temp_parse.type=__cmp_less;
else if((*i).content=="<=")
temp_parse.type=__cmp_less_or_equal;
}
else if(((*i).content==";") || ((*i).content==",") || ((*i).content=="=") || ((*i).content==":") || ((*i).content=="."))
{
if((*i).content==";")
temp_parse.type=__semi;
else if((*i).content==",")
temp_parse.type=__comma;
else if((*i).content=="=")
temp_parse.type=__equal;
else if((*i).content==":")
temp_parse.type=__colon;
else if((*i).content==".")
temp_parse.type=__dot;
}
else if(((*i).type==NUMBER) || ((*i).type==STRING) || ((*i).type==CHAR))
{
if((*i).type==NUMBER)
temp_parse.type=__number;
else if((*i).type==STRING)
temp_parse.type=__string;
else if((*i).type==CHAR)
temp_parse.type=__char;
}
else if(((*i).content=="+") || ((*i).content=="-") || ((*i).content=="*") || ((*i).content=="/") || ((*i).content=="~") || ((*i).content=="!"))
{
if((*i).content=="+")
temp_parse.type=__add_operator;
else if((*i).content=="-")
temp_parse.type=__sub_operator;
else if((*i).content=="*")
temp_parse.type=__mul_operator;
else if((*i).content=="/")
temp_parse.type=__div_operator;
else if((*i).content=="~")
temp_parse.type=__link_operator;
else if((*i).content=="!")
temp_parse.type=__nor_operator;
}
else if(((*i).content=="+=") || ((*i).content=="-=") || ((*i).content=="*=") || ((*i).content=="/=") || ((*i).content=="~="))
{
if((*i).content=="+=")
temp_parse.type=__add_equal;
else if((*i).content=="-=")
temp_parse.type=__sub_equal;
else if((*i).content=="*=")
temp_parse.type=__mul_equal;
else if((*i).content=="/=")
temp_parse.type=__div_equal;
else if((*i).content=="~=")
temp_parse.type=__link_equal;
}
else if(((*i).content=="(") || ((*i).content==")") || ((*i).content=="[") || ((*i).content=="]") || ((*i).content=="{") || ((*i).content=="}"))
{
char c=(*i).content[0];
switch(c)
{
case '(':
temp_parse.type=__left_curve;
break;
case ')':
temp_parse.type=__right_curve;
break;
case '[':
temp_parse.type=__left_bracket;
break;
case ']':
temp_parse.type=__right_bracket;
break;
case '{':
temp_parse.type=__left_brace;
break;
case '}':
temp_parse.type=__right_brace;
break;
}
}
parser.push(temp_parse);//push this into stack
}
std::stack<parse_unit> temp;
while(!parser.empty())
{
temp.push(parser.top());
parser.pop();
}
PDA automata;
automata.stack_input(temp);
automata.main_comp_progress(show);
return;
}
};
#endif