✨ change format of error info
parser now can report exact place where is lacking ';' or ','
This commit is contained in:
parent
a4a7f5075a
commit
c993c77b78
11
nasal.h
11
nasal.h
|
@ -148,6 +148,14 @@ int utf8_hdchk(char head)
|
||||||
return nbytes;
|
return nbytes;
|
||||||
}
|
}
|
||||||
|
|
||||||
|
std::string chrhex(const char c)
|
||||||
|
{
|
||||||
|
std::string res="";
|
||||||
|
res+="0123456789abcdef"[(c&0xf0)>>4];
|
||||||
|
res+="0123456789abcdef"[c&0x0f];
|
||||||
|
return res;
|
||||||
|
}
|
||||||
|
|
||||||
std::string rawstr(const std::string& str)
|
std::string rawstr(const std::string& str)
|
||||||
{
|
{
|
||||||
std::string ret("");
|
std::string ret("");
|
||||||
|
@ -159,8 +167,7 @@ std::string rawstr(const std::string& str)
|
||||||
if(i<=0)
|
if(i<=0)
|
||||||
{
|
{
|
||||||
ret+="\\x";
|
ret+="\\x";
|
||||||
ret+="0123456789abcdef"[(i>>4)&15];
|
ret+=chrhex(i);
|
||||||
ret+="0123456789abcdef"[i&15];
|
|
||||||
continue;
|
continue;
|
||||||
}
|
}
|
||||||
#endif
|
#endif
|
||||||
|
|
17
nasal_err.h
17
nasal_err.h
|
@ -46,30 +46,23 @@ private:
|
||||||
uint32_t error;
|
uint32_t error;
|
||||||
public:
|
public:
|
||||||
nasal_err():error(0){}
|
nasal_err():error(0){}
|
||||||
void err(const char* stage,const std::string& info,const char end='\n')
|
void err(const char* stage,const std::string& info)
|
||||||
{
|
{
|
||||||
++error;
|
++error;
|
||||||
std::cerr<<"["<<stage<<"] "<<info<<end;
|
std::cerr<<"["<<stage<<"] "<<info<<"\n";
|
||||||
}
|
}
|
||||||
void err(const char* stage,uint32_t line,uint32_t column,const std::string& info)
|
void err(const char* stage,uint32_t line,uint32_t column,const std::string& info)
|
||||||
{
|
{
|
||||||
++error;
|
++error;
|
||||||
if(!line)
|
const std::string& code=res[line-1];
|
||||||
{
|
std::cerr<<"["<<stage<<"] "<<file<<":"<<line<<":"<<column<<" "<<info<<"\n"<<code<<"\n";
|
||||||
std::cerr<<"["<<stage<<"] "<<file<<": "<<info<<'\n';
|
|
||||||
return;
|
|
||||||
}
|
|
||||||
std::cerr<<"["<<stage<<"] "<<file<<":"<<line<<":"<<column<<" "<<info<<"\n"<<res[line-1]<<'\n';
|
|
||||||
for(int i=0;i<(int)column-1;++i)
|
for(int i=0;i<(int)column-1;++i)
|
||||||
std::cerr<<char(" \t"[res[line-1][i]=='\t']);
|
std::cerr<<char(" \t"[code[i]=='\t']);
|
||||||
std::cerr<<"^\n";
|
std::cerr<<"^\n";
|
||||||
}
|
}
|
||||||
void err(const char* stage,uint32_t line,const std::string& info)
|
void err(const char* stage,uint32_t line,const std::string& info)
|
||||||
{
|
{
|
||||||
++error;
|
++error;
|
||||||
if(!line)
|
|
||||||
std::cerr<<"["<<stage<<"] "<<file<<": "<<info<<'\n';
|
|
||||||
else
|
|
||||||
std::cerr<<"["<<stage<<"] "<<file<<":"<<line<<" "<<info<<"\n"<<res[line-1]<<'\n';
|
std::cerr<<"["<<stage<<"] "<<file<<":"<<line<<" "<<info<<"\n"<<res[line-1]<<'\n';
|
||||||
}
|
}
|
||||||
void chkerr(){if(error)std::exit(1);}
|
void chkerr(){if(error)std::exit(1);}
|
||||||
|
|
|
@ -87,10 +87,14 @@ nasal_ast nasal_import::lib_import()
|
||||||
|
|
||||||
const std::vector<std::string> libpath=
|
const std::vector<std::string> libpath=
|
||||||
{
|
{
|
||||||
"lib.nas",
|
#ifdef __WIN32
|
||||||
"stl/lib.nas"
|
".\\lib.nas",
|
||||||
|
".\\stl\\lib.nas"
|
||||||
|
#else
|
||||||
|
"./lib.nas",
|
||||||
|
"./stl/lib.nas"
|
||||||
|
#endif
|
||||||
};
|
};
|
||||||
|
|
||||||
std::string filename="";
|
std::string filename="";
|
||||||
for(auto& i:libpath)
|
for(auto& i:libpath)
|
||||||
if(access(i.c_str(),F_OK)!=-1)
|
if(access(i.c_str(),F_OK)!=-1)
|
||||||
|
@ -103,7 +107,7 @@ nasal_ast nasal_import::lib_import()
|
||||||
std::string paths="";
|
std::string paths="";
|
||||||
for(auto& i:libpath)
|
for(auto& i:libpath)
|
||||||
paths+=" "+i+"\n";
|
paths+=" "+i+"\n";
|
||||||
nerr.err("link","cannot find lib file in these paths:\n"+paths,' ');
|
nerr.err("link","cannot find lib file in these paths:\n"+paths);
|
||||||
nerr.chkerr();
|
nerr.chkerr();
|
||||||
return {0,ast_root};
|
return {0,ast_root};
|
||||||
}
|
}
|
||||||
|
|
|
@ -15,11 +15,14 @@
|
||||||
|
|
||||||
enum token_type
|
enum token_type
|
||||||
{
|
{
|
||||||
tok_null=0,// null token default token type
|
tok_null=0, // null token (default token type)
|
||||||
tok_num, // number basic token type
|
tok_num, // number basic token type
|
||||||
tok_str, // string basic token type
|
tok_str, // string basic token type
|
||||||
tok_id, // identifier basic token type
|
tok_id, // identifier basic token type
|
||||||
tok_for,tok_forindex,tok_foreach,tok_while,
|
tok_for, // loop keyword for
|
||||||
|
tok_forindex,// loop keyword forindex
|
||||||
|
tok_foreach, // loop keyword foreach
|
||||||
|
tok_while, // loop keyword while
|
||||||
tok_var,tok_func,tok_break,tok_continue,
|
tok_var,tok_func,tok_break,tok_continue,
|
||||||
tok_ret,tok_if,tok_elsif,tok_else,tok_nil,
|
tok_ret,tok_if,tok_elsif,tok_else,tok_nil,
|
||||||
tok_lcurve,tok_rcurve,
|
tok_lcurve,tok_rcurve,
|
||||||
|
@ -106,20 +109,24 @@ class nasal_lexer
|
||||||
private:
|
private:
|
||||||
uint32_t line;
|
uint32_t line;
|
||||||
uint32_t column;
|
uint32_t column;
|
||||||
uint32_t ptr;
|
size_t ptr;
|
||||||
nasal_err& nerr;
|
nasal_err& nerr;
|
||||||
std::string res;
|
std::string res;
|
||||||
std::vector<token> tokens;
|
std::vector<token> tokens;
|
||||||
|
|
||||||
uint32_t get_type(const std::string&);
|
uint32_t get_type(const std::string&);
|
||||||
void die(std::string info){nerr.err("lexer",line,column,info);};
|
void die(const std::string& info){nerr.err("lexer",line,column,info);}
|
||||||
void open(const std::string&);
|
void open(const std::string&);
|
||||||
std::string utf8_gen();
|
std::string utf8_gen();
|
||||||
std::string id_gen();
|
std::string id_gen();
|
||||||
std::string num_gen();
|
std::string num_gen();
|
||||||
std::string str_gen();
|
std::string str_gen();
|
||||||
public:
|
public:
|
||||||
nasal_lexer(nasal_err& e):line(0),column(0),ptr(0),nerr(e){}
|
nasal_lexer(nasal_err& e):
|
||||||
|
line(1),
|
||||||
|
column(0),
|
||||||
|
ptr(0),
|
||||||
|
nerr(e){}
|
||||||
void scan(const std::string&);
|
void scan(const std::string&);
|
||||||
void print();
|
void print();
|
||||||
const std::vector<token>& get_tokens() const {return tokens;}
|
const std::vector<token>& get_tokens() const {return tokens;}
|
||||||
|
@ -162,16 +169,25 @@ std::string nasal_lexer::utf8_gen()
|
||||||
if(nbytes)
|
if(nbytes)
|
||||||
{
|
{
|
||||||
tmp+=res[ptr++];
|
tmp+=res[ptr++];
|
||||||
for(uint32_t i=0;i<nbytes;++i,++ptr)
|
++column;
|
||||||
|
for(uint32_t i=0;i<nbytes;++i,++ptr,++column)
|
||||||
if(ptr<res.size() && (res[ptr]&0xc0)==0x80)
|
if(ptr<res.size() && (res[ptr]&0xc0)==0x80)
|
||||||
tmp+=res[ptr];
|
tmp+=res[ptr];
|
||||||
if(tmp.length()!=1+nbytes)
|
if(tmp.length()!=1+nbytes)
|
||||||
die("invalid utf-8 character here");
|
{
|
||||||
|
std::string utf_info="0x"+chrhex(tmp[0]);
|
||||||
|
for(uint32_t i=1;i<tmp.size();++i)
|
||||||
|
utf_info+=" 0x"+chrhex(tmp[i]);
|
||||||
|
die("invalid utf-8 character `"+utf_info+"`, make sure this is a text file.");
|
||||||
|
std::exit(1);
|
||||||
|
}
|
||||||
str+=tmp;
|
str+=tmp;
|
||||||
++column;
|
|
||||||
}
|
}
|
||||||
else
|
else
|
||||||
|
{
|
||||||
++ptr;
|
++ptr;
|
||||||
|
++column;
|
||||||
|
}
|
||||||
}
|
}
|
||||||
return str;
|
return str;
|
||||||
}
|
}
|
||||||
|
@ -203,7 +219,7 @@ std::string nasal_lexer::num_gen()
|
||||||
str+=res[ptr++];
|
str+=res[ptr++];
|
||||||
column+=str.length();
|
column+=str.length();
|
||||||
if(str.length()<3)// "0x"
|
if(str.length()<3)// "0x"
|
||||||
die("invalid number:"+str);
|
die("invalid number `"+str+"`.");
|
||||||
return str;
|
return str;
|
||||||
}
|
}
|
||||||
// generate oct number
|
// generate oct number
|
||||||
|
@ -215,7 +231,7 @@ std::string nasal_lexer::num_gen()
|
||||||
str+=res[ptr++];
|
str+=res[ptr++];
|
||||||
column+=str.length();
|
column+=str.length();
|
||||||
if(str.length()<3)// "0o"
|
if(str.length()<3)// "0o"
|
||||||
die("invalid number:"+str);
|
die("invalid number `"+str+"`.");
|
||||||
return str;
|
return str;
|
||||||
}
|
}
|
||||||
// generate dec number
|
// generate dec number
|
||||||
|
@ -232,7 +248,7 @@ std::string nasal_lexer::num_gen()
|
||||||
if(str.back()=='.')
|
if(str.back()=='.')
|
||||||
{
|
{
|
||||||
column+=str.length();
|
column+=str.length();
|
||||||
die("invalid number:"+str);
|
die("invalid number `"+str+"`.");
|
||||||
return "0";
|
return "0";
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -247,7 +263,7 @@ std::string nasal_lexer::num_gen()
|
||||||
if(str.back()=='e' || str.back()=='E' || str.back()=='-' || str.back()=='+')
|
if(str.back()=='e' || str.back()=='E' || str.back()=='-' || str.back()=='+')
|
||||||
{
|
{
|
||||||
column+=str.length();
|
column+=str.length();
|
||||||
die("invalid number:"+str);
|
die("invalid number `"+str+"`.");
|
||||||
return "0";
|
return "0";
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
|
@ -315,7 +331,7 @@ void nasal_lexer::scan(const std::string& file)
|
||||||
std::string str;
|
std::string str;
|
||||||
while(ptr<res.size())
|
while(ptr<res.size())
|
||||||
{
|
{
|
||||||
while(ptr<res.size() && (res[ptr]==' ' || res[ptr]=='\n' || res[ptr]=='\t' || res[ptr]=='\r'))// || res[ptr]<0))
|
while(ptr<res.size() && (res[ptr]==' ' || res[ptr]=='\n' || res[ptr]=='\t' || res[ptr]=='\r' || res[ptr]==0))
|
||||||
{
|
{
|
||||||
// these characters will be ignored, and '\n' will cause ++line
|
// these characters will be ignored, and '\n' will cause ++line
|
||||||
++column;
|
++column;
|
||||||
|
@ -348,7 +364,7 @@ void nasal_lexer::scan(const std::string& file)
|
||||||
++column;
|
++column;
|
||||||
uint32_t type=get_type(str);
|
uint32_t type=get_type(str);
|
||||||
if(!type)
|
if(!type)
|
||||||
die("invalid operator:"+str);
|
die("invalid operator `"+str+"`.");
|
||||||
tokens.push_back({line,column,type,str});
|
tokens.push_back({line,column,type,str});
|
||||||
++ptr;
|
++ptr;
|
||||||
}
|
}
|
||||||
|
@ -375,8 +391,8 @@ void nasal_lexer::scan(const std::string& file)
|
||||||
else
|
else
|
||||||
{
|
{
|
||||||
++column;
|
++column;
|
||||||
++ptr;
|
char c=res[ptr++];
|
||||||
die("unknown character.");
|
die("invalid character 0x"+chrhex(c)+".");
|
||||||
}
|
}
|
||||||
}
|
}
|
||||||
tokens.push_back({line,column,tok_eof,"eof"});
|
tokens.push_back({line,column,tok_eof,"eof"});
|
||||||
|
|
|
@ -48,7 +48,7 @@ private:
|
||||||
nasal_ast root;
|
nasal_ast root;
|
||||||
nasal_err& nerr;
|
nasal_err& nerr;
|
||||||
|
|
||||||
void die(uint32_t,std::string);
|
void die(uint32_t,std::string,bool);
|
||||||
void match(uint32_t type,const char* info=nullptr);
|
void match(uint32_t type,const char* info=nullptr);
|
||||||
bool check_comma(const uint32_t*);
|
bool check_comma(const uint32_t*);
|
||||||
bool check_multi_scalar();
|
bool check_multi_scalar();
|
||||||
|
@ -117,15 +117,20 @@ void nasal_parse::compile(const nasal_lexer& lexer)
|
||||||
match(tok_semi);
|
match(tok_semi);
|
||||||
// the last expression can be recognized without semi
|
// the last expression can be recognized without semi
|
||||||
else if(need_semi_check(root.child().back()) && tokens[ptr].type!=tok_eof)
|
else if(need_semi_check(root.child().back()) && tokens[ptr].type!=tok_eof)
|
||||||
die(error_line,"expected \";\"");
|
die(error_line,"expected \";\"",true);
|
||||||
}
|
}
|
||||||
nerr.chkerr();
|
nerr.chkerr();
|
||||||
}
|
}
|
||||||
void nasal_parse::die(uint32_t line,std::string info)
|
void nasal_parse::die(uint32_t line,std::string info,bool report_prev=false)
|
||||||
{
|
{
|
||||||
int col=(int)tokens[ptr].column-(int)tokens[ptr].str.length();
|
int col=(int)tokens[ptr].column-(int)tokens[ptr].str.length();
|
||||||
if(tokens[ptr].type==tok_str)
|
if(tokens[ptr].type==tok_str)
|
||||||
col-=2; // tok_str's str has no \"
|
col-=2; // tok_str's str has no \"
|
||||||
|
if(report_prev && ptr-1>=0) // used to report lack of ',' ';'
|
||||||
|
{
|
||||||
|
line=tokens[ptr-1].line;
|
||||||
|
col=tokens[ptr-1].column+1;
|
||||||
|
}
|
||||||
nerr.err("parse",line,col<0?0:col,info);
|
nerr.err("parse",line,col<0?0:col,info);
|
||||||
}
|
}
|
||||||
void nasal_parse::match(uint32_t type,const char* info)
|
void nasal_parse::match(uint32_t type,const char* info)
|
||||||
|
@ -155,7 +160,7 @@ bool nasal_parse::check_comma(const uint32_t* panic_set)
|
||||||
for(uint32_t i=0;panic_set[i];++i)
|
for(uint32_t i=0;panic_set[i];++i)
|
||||||
if(tokens[ptr].type==panic_set[i])
|
if(tokens[ptr].type==panic_set[i])
|
||||||
{
|
{
|
||||||
die(error_line,"expected \',\' between scalars");
|
die(error_line,"expected \',\' between scalars",true);
|
||||||
return true;
|
return true;
|
||||||
}
|
}
|
||||||
return false;
|
return false;
|
||||||
|
@ -309,7 +314,7 @@ nasal_ast nasal_parse::hash()
|
||||||
if(tokens[ptr].type==tok_comma)
|
if(tokens[ptr].type==tok_comma)
|
||||||
match(tok_comma);
|
match(tok_comma);
|
||||||
else if(tokens[ptr].type==tok_id || tokens[ptr].type==tok_str)// first set of hashmember
|
else if(tokens[ptr].type==tok_id || tokens[ptr].type==tok_str)// first set of hashmember
|
||||||
die(error_line,"expected \',\' between hash members");
|
die(error_line,"expected \',\' between hash members",true);
|
||||||
else
|
else
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
@ -377,7 +382,7 @@ nasal_ast nasal_parse::args()
|
||||||
if(tokens[ptr].type==tok_comma)
|
if(tokens[ptr].type==tok_comma)
|
||||||
match(tok_comma);
|
match(tok_comma);
|
||||||
else if(tokens[ptr].type==tok_id)// first set of identifier
|
else if(tokens[ptr].type==tok_id)// first set of identifier
|
||||||
die(error_line,"expected \',\' between identifiers");
|
die(error_line,"expected \',\' between identifiers",true);
|
||||||
else
|
else
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
@ -484,7 +489,7 @@ nasal_ast nasal_parse::exprs()
|
||||||
match(tok_semi);
|
match(tok_semi);
|
||||||
// the last expression can be recognized without semi
|
// the last expression can be recognized without semi
|
||||||
else if(need_semi_check(node.child().back()) && tokens[ptr].type!=tok_rbrace)
|
else if(need_semi_check(node.child().back()) && tokens[ptr].type!=tok_rbrace)
|
||||||
die(error_line,"expected \";\"");
|
die(error_line,"expected \';\'",true);
|
||||||
}
|
}
|
||||||
match(tok_rbrace,"expected \'}\' when generating expressions");
|
match(tok_rbrace,"expected \'}\' when generating expressions");
|
||||||
}
|
}
|
||||||
|
@ -796,7 +801,7 @@ nasal_ast nasal_parse::multi_id()
|
||||||
if(tokens[ptr].type==tok_comma)
|
if(tokens[ptr].type==tok_comma)
|
||||||
match(tok_comma);
|
match(tok_comma);
|
||||||
else if(tokens[ptr].type==tok_id)// first set of identifier
|
else if(tokens[ptr].type==tok_id)// first set of identifier
|
||||||
die(error_line,"expected \',\' between identifiers");
|
die(error_line,"expected \',\' between identifiers",true);
|
||||||
else
|
else
|
||||||
break;
|
break;
|
||||||
}
|
}
|
||||||
|
|
Loading…
Reference in New Issue