--- parser3/src/main/compile.y 2001/02/21 07:31:41 1.6 +++ parser3/src/main/compile.y 2001/03/06 13:24:40 1.52 @@ -1,183 +1,304 @@ +/* + $Id: compile.y,v 1.52 2001/03/06 13:24:40 paf Exp $ +*/ + %{ -#define YYSTYPE Array/**/ * -#define YYPARSE_PARAM pc -#define YYLEX_PARAM pc -#define YYDEBUG 1 +#define YYSTYPE Array/**/ * +#define YYPARSE_PARAM pc +#define YYLEX_PARAM pc +#define YYDEBUG 1 #define YYERROR_VERBOSE -#define yyerror(msg) real_yyerror((parse_control *)pc, msg) -#define YYPRINT(file, type, value) yyprint (file, type, value) +#define yyerror(msg) real_yyerror((parse_control *)pc, msg) +#define YYPRINT(file, type, value) yyprint(file, type, value) #include #include #include #include "compile_tools.h" +#include "pa_value.h" +#include "pa_request.h" +#include "pa_vobject.h" +#include "pa_vdouble.h" -int real_yyerror (parse_control *pc, char *s); -static void yyprint (FILE *file, int type, YYSTYPE value); +#define SELF_NAME "self" +#define USES_NAME "USES" + +int real_yyerror(parse_control *pc, char *s); +static void yyprint(FILE *file, int type, YYSTYPE value); int yylex(YYSTYPE *lvalp, void *pc); -#define PC ((parse_control *)pc) +// local convinient inplace typecast & var +#define PC ((parse_control *)pc) +#define POOL *PC->pool +#undef NEW +#define NEW new(POOL) %} %pure_parser -%token END_OF_NAME +%token EON %token STRING %token BOGUS +%token LOGICAL_AND LOGICAL_OR %% -result: input { PC->result=$1 }; -input: empty | codes; +all: + one_big_piece { + String& name_main=*NEW String(POOL); + name_main.APPEND_CONST(MAIN_METHOD_NAME); + Array& param_names=*NEW Array(POOL); + Array& local_names=*NEW Array(POOL); + Method& method=*NEW Method(POOL, name_main, param_names, local_names, *$1); + PC->vclass->add_method(name_main, method); +} +| methods; + +methods: method | methods method; +one_big_piece: maybe_codes; + +method: control_method | code_method; + +control_method: '@' STRING '\n' + control_strings { + String& name=*SLA2S($2); + YYSTYPE strings_code=$4; + if(strings_code->size()<1*2) { + strcpy(PC->error, "@"); + strcat(PC->error, name.cstr()); + strcat(PC->error, " is empty"); + YYERROR; + } + if(name==CLASS_NAME) { + if(strings_code->size()==1*2) + PC->vclass->set_name(*SLA2S(strings_code)); + else { + strcpy(PC->error, "@"CLASS_NAME" must contain sole name"); + YYERROR; + } + } else { + if(name==USES_NAME) { + for(int i=0; isize(); i+=2) { + String *file=SLA2S(strings_code, i); + file->APPEND_CONST(".p"); + PC->request->use(file->cstr(), 0); + } + } else if(name==BASE_NAME) { + if(strings_code->size()==1*2) { + String& base_name=*SLA2S(strings_code); + VClass *base=static_cast( + PC->request->classes().get(base_name)); + if(!base) { + strcpy(PC->error, base_name.cstr()); + strcat(PC->error, ": undefined class in @"BASE_NAME); + YYERROR; + } + PC->vclass->set_base(*base); + } else { + strcpy(PC->error, "@"BASE_NAME" must contain sole name"); + YYERROR; + } + } else { + strcpy(PC->error, name.cstr()); + strcat(PC->error, ": invalid special name. valid names are " + CLASS_NAME", "USES_NAME" and "BASE_NAME); + YYERROR; + } + } +}; +control_strings: control_string | control_strings control_string { $$=$1; P($$, $2) }; +control_string: maybe_string '\n'; +maybe_string: empty | STRING; + +code_method: '@' STRING bracketed_maybe_strings maybe_bracketed_strings maybe_comment '\n' + maybe_codes { + const String *name=SLA2S($2); + + YYSTYPE params_names_code=$3; + Array& params_names=*NEW Array(POOL); + for(int i=0; isize(); i+=2) + params_names+=SLA2S(params_names_code, i); + + YYSTYPE locals_names_code=$4; + Array& locals_names=*NEW Array(POOL); + for(int i=0; isize(); i+=2) + locals_names+=SLA2S(locals_names_code, i); + + Method& method=*NEW Method(POOL, *name, params_names, locals_names, *$7); + PC->vclass->add_method(*name, method); +}; + +maybe_bracketed_strings: empty | bracketed_maybe_strings; +bracketed_maybe_strings: '[' maybe_strings ']' {$$=$2}; +maybe_strings: empty | strings; +strings: STRING | strings ';' STRING { $$=$1; P($$, $3) }; + +maybe_comment: empty | STRING; /* codes */ +maybe_codes: empty | codes; + codes: code | codes code { $$=$1; - P($$,$2); + P($$, $2); }; code: write_str_literal | action; action: get | put | with | call; /* get */ -get: '$' any_name { +get: '$' get_name { $$=$2; /* stack: resulting value */ - OP($$,OP_WRITE); /* value=pop; write(value) */ + OP($$, OP_WRITE); /* value=pop; write(value) */ }; - -any_name: name_without_curly_rdive END_OF_NAME | name_in_curly_rdive; - +get_name: name_without_curly_rdive EON | name_in_curly_rdive; name_in_curly_rdive: '{' name_without_curly_rdive '}' { $$=$2 }; -name_without_curly_rdive: name_rdive { - /* - TODO: подсмотреть в $1, и если там в первом элементе первая буква ":" - то выкинуть её и делать не OP_WITH_READ, а WITH_ROOT - TODO: подсмотреть в $1, и если там первым элементом self, - то выкинуть его и делать не OP_WITH_READ, а WITH_SELF - */ - $$=N(PC->pool); OP($$, OP_WITH_READ); /* stack: starting context */ - P($$,$1); /* diving code; stack: current context */ +name_without_curly_rdive: + name_without_curly_rdive_read +| name_without_curly_rdive_root +| name_without_curly_rdive_class; +name_without_curly_rdive_read: name_without_curly_rdive_code { + $$=N(POOL); + Array *diving_code=$1; + String *first_name=SLA2S(diving_code); + if(first_name && *first_name==SELF_NAME) { + OP($$, OP_WITH_SELF); /* stack: starting context */ + P($$, diving_code, + /* skip over... */ + diving_code->size()>2?3/*OP_+string+get_element*/:2/*OP_+string*/); + } else { + OP($$, OP_WITH_READ); /* stack: starting context */ + P($$, diving_code); + } + /* diving code; stack: current context */ }; -name_rdive: name_advance2 | name_path name_advance2 { $$=$1; P($$,$2) } +name_without_curly_rdive_root: ':' name_without_curly_rdive_code { + $$=N(POOL); + OP($$, OP_WITH_ROOT); /* stack: starting context */ + P($$, $2); /* diving code; stack: current context */ +}; +name_without_curly_rdive_class: class_prefix name_without_curly_rdive_code { $$=$1; P($$, $2) }; +name_without_curly_rdive_code: name_advance2 | name_path name_advance2 { $$=$1; P($$, $2) }; /* put */ -put: '$' name_expr_dive '(' constructor_value ')' { -/* - TODO: подсмотреть в $3, и если там в первом элементе первая буква ":" - то выкинуть её и делать не OP_WITH_OP_WRITE, а WITH_ROOT - TODO: подсмотреть в $3, и если там первым элементом self, - то выкинуть его и делать не OP_WITH_OP_WRITE, а WITH_SELF - если ничего не осталось - $self(xxx) - обругать -*/ - $$=N(PC->pool); - OP($$, OP_WITH_WRITE); /* stack: starting context */ - P($$,$2); /* diving code; stack: context,name */ - P($$,$4); /* stack: context,name,constructor_value */ - OP($$,OP_CONSTRUCT); /* value=pop; name=pop; context=pop; construct(context,name,value) */ +put: '$' name_expr_wdive constructor_value { + $$=$2; /* stack: context,name */ + P($$, $3); /* stack: context,name,constructor_value */ + OP($$, OP_CONSTRUCT); /* value=pop; name=pop; context=pop; construct(context,name,value) */ +}; +name_expr_wdive: + name_expr_wdive_write +| name_expr_wdive_root +| name_expr_wdive_class; +name_expr_wdive_write: name_expr_dive_code { + $$=N(POOL); + Array *diving_code=$1; + String *first_name=SLA2S(diving_code); + if(first_name && *first_name==SELF_NAME) { + OP($$, OP_WITH_SELF); /* stack: starting context */ + P($$, diving_code, + /* skip over... */ + diving_code->size()>2?3/*OP_+string+get_element*/:2/*OP_+string*/); + } else { + OP($$, OP_WITH_WRITE); /* stack: starting context */ + P($$, diving_code); + } + /* diving code; stack: current context */ +}; +name_expr_wdive_root: ':' name_expr_dive_code { + $$=N(POOL); + OP($$, OP_WITH_ROOT); /* stack: starting context */ + P($$, $2); /* diving code; stack: context,name */ }; +name_expr_wdive_class: class_prefix name_expr_dive_code { $$=$1; P($$, $2) }; + constructor_value: - constructor_one_param_value -| constructor_two_params_value /* $var(=;2*2) $var(%d;2*2) $var(+;1) */ + '[' constructor_code_value ']' { $$=$2 } +| '(' constructor_expression_value ')' { $$=$2 } ; -constructor_one_param_value: - empty_value /* optimized $var() case */ -| STRING /* optimized $var(STRING) case */ -| complex_constructor_param_value /* $var(something complex) */ +constructor_code_value: + empty_value /* optimized $var[] case */ +| STRING /* optimized $var[STRING] case */ +| complex_constructor_code_value /* $var[something complex] */ ; -empty_value: empty; -complex_constructor_param_value: complex_constructor_param_body { - $$=N(PC->pool); +complex_constructor_code_value: complex_constructor_code { + $$=N(POOL); OP($$, OP_CREATE_EWPOOL); /* stack: empty write context */ - P($$,$1); /* some codes to that context */ - OP($$,OP_REDUCE_EWPOOL); /* context=pop; stack: context.value() */ + P($$, $1); /* some codes to that context */ + OP($$, OP_REDUCE_EWPOOL); /* context=pop; stack: context.value() */ }; -complex_constructor_param_body: - codes__excluding_sole_str_literal -| codes__str__followed_by__excluding_sole_str_literal +complex_constructor_code: codes__excluding_sole_str_literal; +codes__excluding_sole_str_literal: action | code codes { $$=$1; P($$, $2) }; + +constructor_expression_value: + empty_value /* optimized $var() case */ +| STRING /* optimized $var(STRING) case */ +;/*| complex_constructor_expression_value /* $var(something complex) * / ; -constructor_two_params_value: STRING ';' constructor_one_param_value { - const String *operator_or_fmtS=LA2S($1); - char *operator_or_fmt=operator_or_fmtS->cstr(); - $$=N(PC->pool); - P($$, $1);/* stack: ncontext name operator_or_fmt */ - P($$, $3); /* stack: ncontext name operator_or_fmt expr */ - switch(operator_or_fmt[0]) { - case '=': case '%': - OP($$, OP_EXPRESSION_EVAL); - break; - case '+': case '-': case '*': case '/': - OP($$, OP_MODIFY_EVAL); - break; - default: - strcpy(PC->error, "invalid modification operator"); - YYERROR; - } - /* stack: ncontext name value */ +complex_constructor_expression_value: complex_constructor_expression { + $$=N(POOL); + OP($$, OP_CREATE_SWPOOL); /* stack: empty write context * / + P($$, $1); /* some codes to that context * / + OP($$, OP_REDUCE_SWPOOL); /* context=pop; stack: context.get_string() * / }; - +complex_constructor_expression: +; +*/ /* call */ -call: '^' name_expr_dive store_params END_OF_NAME { /* ^field.$method{vasya} */ -/* - TODO: подсмотреть в $3, и если там в первом элементе первая буква ":" - то выкинуть её и делать не OP_WITH_READ, а WITH_ROOT - TODO: подсмотреть в $3, и если там первым элементом self, - то выкинуть его и делать не OP_WITH_READ, а WITH_SELF - TODO: - если первым в $3 идёт result - то - выкинуть его - если там ещё что-то осталось, - то - не OP_WITH_READ, а WITH_RESULT - иначе // ^result(value) - обругать безобразие -*/ - $$=N(PC->pool); - OP($$, OP_WITH_READ); /* stack: starting context */ - P($$,$2); /* diving code; stack: context,method_name */ - OP($$,OP_GET_METHOD_FRAME); /* stack: context,method_frame */ - P($$,$3); /* filling method_frame.store_params */ - OP($$,OP_CALL); /* method_frame=pop; ncontext=pop; call(ncontext,method_frame) */ +call: '^' call_name store_params EON { /* ^field.$method{vasya} */ + $$=$2; /* with_xxx,diving code; stack: context,method_junction */ + OP($$, OP_GET_METHOD_FRAME); /* stack: context,method_frame */ + P($$, $3); /* filling method_frame.store_params */ + OP($$, OP_CALL); /* method_frame=pop; ncontext=pop; call(ncontext,method_frame) */ }; -store_params: store_param | store_params store_param { $$=$1; P($$,$2) }; +call_name: name_without_curly_rdive; + +store_params: store_param | store_params store_param { $$=$1; P($$, $2) }; store_param: store_round_param | store_curly_param; -store_round_param: '(' store_param_parts ')' {$$=$2}; -store_param_parts: store_param_part | store_param_parts ';' store_param_part { $$=$1; P($$,$3) }; -store_param_part: constructor_one_param_value { +store_round_param: '[' store_param_parts ']' {$$=$2}; +store_param_parts: + store_param_part +| store_param_parts ';' store_param_part { $$=$1; P($$, $3) } +; +store_curly_param: '{' maybe_codes '}' { + $$=N(POOL); + PCA($$, $2); + OP($$, OP_STORE_PARAM); +}; +store_param_part: + empty /* optimized () case */ +| STRING { /* optimized (STRING) case */ $$=$1; - OP($$,OP_STORE_PARAM); + OP($$, OP_STORE_PARAM); } -store_curly_param: '{' input '}' { - $$=N(PC->pool); - OP($$, OP_CODE_ARRAY); - AA($$,$2); - OP($$,OP_CREATE_JUNCTION); - OP($$,OP_STORE_PARAM); -}; +| complex_constructor_code_value { /* (something complex) */ + $$=$1; + OP($$, OP_STORE_PARAM); +} +; /* name */ -name_expr_dive: name_expr_value | name_path name_expr_value { $$=$1; P($$,$2) }; +name_expr_dive_code: name_expr_value | name_path name_expr_value { $$=$1; P($$, $2) }; -name_path: name_step | name_path name_step { $$=$1; P($$,$2) }; +name_path: name_step | name_path name_step { $$=$1; P($$, $2) }; name_step: name_advance1 '.'; name_advance1: name_expr_value { /* stack: context */ $$=$1; /* stack: context,name */ - OP($$,OP_GET_ELEMENT); /* name=pop; context=pop; stack: context.get_element(name) */ + OP($$, OP_GET_ELEMENT); /* name=pop; context=pop; stack: context.get_element(name) */ }; name_advance2: name_expr_value { /* stack: context */ $$=$1; /* stack: context,name */ - OP($$,OP_GET_ELEMENT); /* name=pop; context=pop; stack: context.get_element(name) */ + OP($$, OP_GET_ELEMENT); /* name=pop; context=pop; stack: context.get_element(name) */ } | STRING BOGUS ; @@ -188,28 +309,44 @@ name_expr_value: ; name_expr_subvar_value: '$' subvar_ref_name_rdive { $$=$2; - OP($$,OP_GET_ELEMENT); + OP($$, OP_GET_ELEMENT); }; name_expr_with_subvar_value: STRING subvar_get_writes { - $$=N(PC->pool); + $$=N(POOL); OP($$, OP_CREATE_EWPOOL); - P($$,$1); - OP($$,OP_WRITE); - P($$,$2); - OP($$,OP_REDUCE_EWPOOL); + P($$, $1); + OP($$, OP_WRITE); + P($$, $2); + OP($$, OP_REDUCE_EWPOOL); +}; +subvar_ref_name_rdive: subvar_ref_name_rdive_read | subvar_ref_name_rdive_root; +subvar_ref_name_rdive_read: STRING { + $$=N(POOL); + OP($$, OP_WITH_READ); + P($$, $1); +}; +subvar_ref_name_rdive_root: ':' STRING { + $$=N(POOL); + OP($$, OP_WITH_ROOT); + P($$, $2); }; -subvar_ref_name_rdive: STRING { -/* - TODO: подсмотреть в $1, и если там в первом элементе первая буква ":" - то выкинуть её и делать не OP_WITH_READ, а WITH_ROOT -*/ - $$=N(PC->pool); OP($$, OP_WITH_READ); - P($$,$1); -}; -subvar_get_writes: subvar__get_write | subvar_get_writes subvar__get_write { $$=$1; P($$,$2) }; +subvar_get_writes: subvar__get_write | subvar_get_writes subvar__get_write { $$=$1; P($$, $2) }; subvar__get_write: '$' subvar_ref_name_rdive { $$=$2; - OP($$,OP_GET_ELEMENT__WRITE); + OP($$, OP_GET_ELEMENT__WRITE); +}; + +class_prefix: STRING ':' { + String& name=*SLA2S($1); + VClass *vclass=static_cast(PC->request->classes().get(name)); + if(!vclass) { + strcpy(PC->error, "'"); + strcat(PC->error, name.cstr()); + strcat(PC->error, "' class is undefined in call"); + YYERROR; + } + //TODO: убрать зависимость от статических @USE, сделать имя, а не ссылку + $$=CL(vclass); // vclass }; @@ -217,48 +354,38 @@ subvar__get_write: '$' subvar_ref_name_r with: '$' name_without_curly_rdive '{' codes '}' { $$=$2; - OP($$,OP_CREATE_RWPOOL); - P($$,$4); - OP($$,OP_REDUCE_RWPOOL); - OP($$,OP_WRITE); + OP($$, OP_CREATE_RWPOOL); + P($$, $4); + OP($$, OP_REDUCE_RWPOOL); + OP($$, OP_WRITE); }; -/* codes_in_brackets */ +/* basics */ -codes__str__followed_by__excluding_sole_str_literal: - write_str_literal codes__excluding_sole_str_literal { - $$=$1; - P($$,$2); -} -; -codes__excluding_sole_str_literal: - action -| codes__excluding_sole_str_literal write_str_literal { - $$=$1; - P($$,$2); -} -; write_str_literal: STRING { - $$=$1; - OP($$,OP_WRITE); + if(SLA2S($1)->size()) { + $$=$1; + OP($$, OP_WRITE); + } else { + // optimized case of special end of macro. see yylex + $$=N(POOL); + } }; - -/* */ - -empty: /* empty */ { $$=N(PC->pool) }; +empty_value: /* empty */ { $$=SL(NEW VString(POOL)) }; +empty: /* empty */ { $$=N(POOL) }; %% /* 000$111(2222)00 000$111{3333}00 - $,^: push, =0 + $,^: push,=0 1:( { break=pop 2:( ) pop 3:{ } pop 000^111(2222)4444{33333}4000 - $,^: push, =0 + $,^: push,=0 1:( { break=pop 2:( )=4 3:{ }=4 @@ -267,11 +394,10 @@ empty: /* empty */ { $$=N(PC->pool) }; int yylex(YYSTYPE *lvalp, void *pc) { #define lexical_brackets_nestage PC->brackets_nestages[PC->sp] + #define RC {result=c; goto break2; } register int c; int result; - char *start; - int start_line; if(PC->pending_state) { result=PC->pending_state; @@ -279,257 +405,397 @@ int yylex(YYSTYPE *lvalp, void *pc) { return result; } - start=PC->source; - start_line=PC->line; - while(1) { - c=*PC->source++; + char *begin=PC->source; + char *end; + int begin_line=PC->line; + while(true) { + c=*(end=(PC->source++)); if(c=='\n') { PC->line++; - PC->col=1; - } + PC->col=0; + } else PC->col++; - /* escaping: ^^ ^$ ^; ^) ^} ^( ^{ */ - if(c=='^') { - char pending_c=*PC->source; - - if(pending_c == '^' || pending_c == '$' || pending_c == ';' || - pending_c == '(' || pending_c == ')' || - pending_c == '{' || pending_c == '}') { - /* append piece till ^ */ - PC->string->APPEND(start, PC->source-start -1/*^*/, PC->file, start_line); - /* reset piece 'start' position & line */ - start=PC->source+1/*^*/; - start_line=PC->line; - /* skip over ^ and _ */ - PC->source+=2; - /* skip analysis = forced literal */ + // escaping: ^^ ^$ ^; ^) ^} ^( ^{ ^" + if(c=='^') + switch(*PC->source) { + case '^': case '$': case ';': + case '[': case ']': + case '{': case '}': + case '"': + if(end!=begin) { + // append piece till ^ + PC->string->APPEND(begin, end-begin, PC->file, begin_line); + } + // reset piece 'start' position & line + begin=PC->source; // ^ + begin_line=PC->line; + // skip over ^ and _ + PC->source++; PC->col++; + // skip analysis = forced literal continue; } - } switch(PC->ls) { + + // USER'S = NOT OURS case LS_USER: - if(c=='$') { - push_LS(PC); PC->ls=LS_VAR_NAME_SIMPLE; - result=c; - goto break2; + switch(c) { + case '$': + push_LS(PC, LS_VAR_NAME_SIMPLE); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; + case '@': + if(PC->col==0+1) { + push_LS(PC, LS_DEF_NAME); + RC; + } + break; } - if(c=='^') { - push_LS(PC); PC->ls=LS_METHOD_NAME; - result=c; - goto break2; + break; + + // STRING IN EXPRESSION + case LS_EXPRESSION_STRING: + switch(c) { + case '"': + pop_LS(PC); //"abc". + RC; + case '$': + push_LS(PC, LS_VAR_NAME_SIMPLE); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; } break; - /* VAR */ - case LS_VAR_NAME_SIMPLE: - if(c==0 || - c==' '|| c=='\t' || c=='\n' || - c==')' || c=='}') { - pop_LS(PC); - PC->source--; PC->col--; - result=END_OF_NAME; - goto break2; + // METHOD DEFINITION + case LS_DEF_NAME: + switch(c) { + case '[': + PC->ls=LS_DEF_PARAMS; + RC; + case '\n': + PC->ls=LS_DEF_SPECIAL_BODY; + RC; } - if(PC->source==start && c=='{') { /* ${name}, no need of END_OF_NAME, switching LS */ - PC->ls=LS_VAR_NAME_CURLY; - result=c; - goto break2; - } - if(c=='(') { - PC->ls=LS_VAR_ROUND; - lexical_brackets_nestage=1; - result=c; - goto break2; - } - if(c=='{') { - PC->ls=LS_VAR_CURLY; - lexical_brackets_nestage=1; - result=c; - goto break2; - } - if(c=='.'/* name part delim */ || c=='$'/* name part subvar */) { - result=c; - goto break2; + break; + + case LS_DEF_PARAMS: + switch(c) { + case ';': + RC; + case ']': + PC->ls=*PC->source=='['?LS_DEF_LOCALS:LS_DEF_COMMENT; + RC; + case '\n': // wrong. bailing out + pop_LS(PC); + RC; } break; - case LS_VAR_NAME_CURLY: - if(c=='}') { /* ${name} finished, restoring LS */ + + case LS_DEF_LOCALS: + switch(c) { + case '[': + case ';': + RC; + case ']': + PC->ls=LS_DEF_COMMENT; + RC; + case '\n': // wrong. bailing out pop_LS(PC); - result=c; - goto break2; + RC; } - if(c=='.'/* name part delim */ || c=='$'/*name part subvar*/) { - result=c; - goto break2; + break; + + case LS_DEF_COMMENT: + if(c=='\n') { + pop_LS(PC); + RC; } break; - case LS_VAR_ROUND: - if(c=='$') { - push_LS(PC); PC->ls=LS_VAR_NAME_SIMPLE; - result=c; - goto break2; + + case LS_DEF_SPECIAL_BODY: + if(c=='\n') { + switch(*PC->source) { + case '@': case 0: // end of special_code + pop_LS(PC); + break; + } + RC; } - if(c=='^') { - push_LS(PC); PC->ls=LS_METHOD_NAME; - result=c; - goto break2; + break; + + // (EXPRESSION) + case LS_EXPRESSION_BODY: + switch(c) { + case ')': + if(--lexical_brackets_nestage==0) + pop_LS(PC); //(EXPRESSION). + RC; + case '$': + push_LS(PC, LS_VAR_NAME_IN_EXPRESSION); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; + case '(': + lexical_brackets_nestage++; + RC; + case '+': case '-': case '*': case '/': case '%': + case '&': case '|': + case '<': case '>': case '=': case '!': + case ';': + RC; + case '"': + push_LS(PC, LS_EXPRESSION_STRING); + RC; + case 'l': case 'g': case 'e': case 'n': + if(end==begin) // right after whitespace + switch(char next_c=*PC->source) { +// case '?': // ok [and bad cases, yacc would bark at them] + case 't': // lt gt [et nt] + case 'e': // le ge ne [ee] + case 'q': // eq [lq gq nq] + PC->source++; PC->col++; + PC->pending_state=next_c; + return c; + } + break; + case ' ': case '\t': case '\n': + if(end!=begin) { + // append piece till whitespace + PC->string->APPEND(begin, end-begin, PC->file, begin_line); + } + // reset piece 'start' position & line + begin=PC->source; // after whitespace + begin_line=PC->line; + continue; } - if(c==')') { - if(--lexical_brackets_nestage==0) { + break; + + // VARIABLE GET/PUT/WITH + case LS_VAR_NAME_SIMPLE: + case LS_VAR_NAME_IN_EXPRESSION: + if(PC->ls==LS_VAR_NAME_IN_EXPRESSION) { + // name in expression ends also before binary operators + switch(c) { + case '+': case '-': case '*': case '/': case '%': + case '&': case '|': + case '<': case '>': case '=': case '!': pop_LS(PC); - result=c; + PC->source--; if(--PC->col<0) { PC->line--; PC->col=-1; } + result=EON; goto break2; } } - if(c==';'/* operator_or_fmt;value delim */) { - result=c; + switch(c) { + case 0: + case ' ': case '\t': case '\n': + case ';': + case ']': case '}': + pop_LS(PC); + PC->source--; if(--PC->col<0) { PC->line--; PC->col=-1; } + result=EON; goto break2; + case '[': + PC->ls=LS_VAR_SQUARE; + lexical_brackets_nestage=1; + RC; + case '{': + if(begin==end) { // ${name}, no need of EON, switching LS + PC->ls=LS_VAR_NAME_CURLY; + } else { + PC->ls=LS_VAR_CURLY; + lexical_brackets_nestage=1; + } + + RC; + case '(': + PC->ls=LS_EXPRESSION_BODY; + lexical_brackets_nestage=1; + RC; + case '.': // name part delim + case '$': // name part subvar + case ':': // ':name' or 'class:name' + RC; } - if(c=='(') - lexical_brackets_nestage++; break; - case LS_VAR_CURLY: - if(c=='$') { - push_LS(PC); PC->ls=LS_VAR_NAME_SIMPLE; - result=c; - goto break2; + + case LS_VAR_NAME_CURLY: + switch(c) { + case '}': // ${name} finished, restoring LS + pop_LS(PC); + RC; + case '.': // name part delim + case '$': // name part subvar + case ':': // ':name' or 'class:name' + RC; } - if(c=='^') { - push_LS(PC); PC->ls=LS_METHOD_NAME; - result=c; - goto break2; + break; + + case LS_VAR_SQUARE: + switch(c) { + case '$': + push_LS(PC, LS_VAR_NAME_SIMPLE); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; + case ']': + if(--lexical_brackets_nestage==0) { + pop_LS(PC); + RC; + } + break; + case ';': // operator_or_fmt;value delim + RC; + case '[': + lexical_brackets_nestage++; + break; } - if(c=='}') + break; + + case LS_VAR_CURLY: + switch(c) { + case '$': + push_LS(PC, LS_VAR_NAME_SIMPLE); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; + case '}': if(--lexical_brackets_nestage==0) { pop_LS(PC); - result=c; - goto break2; + RC; } - if(c=='{') + break; + case '{': lexical_brackets_nestage++; + break; + } break; - /* METHOD */ + // METHOD CALL case LS_METHOD_NAME: - if(c=='(') { - PC->ls=LS_METHOD_ROUND; + switch(c) { + case '[': + PC->ls=LS_METHOD_SQUARE; lexical_brackets_nestage=1; - result=c; - goto break2; - } - if(c=='{') { + RC; + case '{': PC->ls=LS_METHOD_CURLY; lexical_brackets_nestage=1; - result=c; - goto break2; - } - if(c=='.'/* name part delim */ || c=='$'/* name part subvar */) { - result=c; - goto break2; + RC; + case '.': // name part delim + case '$': // name part subvar + case ':': // ':name' or 'class:name' + RC; } break; - case LS_METHOD_ROUND: - if(c=='$') { - push_LS(PC); PC->ls=LS_VAR_NAME_SIMPLE; - result=c; - goto break2; - } - if(c=='^') { - push_LS(PC); PC->ls=LS_METHOD_NAME; - result=c; - goto break2; - } - if(c==';'/* param delim */) { - result=c; - goto break2; - } - if(c==')') + + case LS_METHOD_SQUARE: + switch(c) { + case '$': + push_LS(PC, LS_VAR_NAME_SIMPLE); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; + case ';': // param delim + RC; + case ']': if(--lexical_brackets_nestage==0) { PC->ls=LS_METHOD_AFTER; - result=c; - goto break2; + RC; } - if(c=='(') + break; + case '[': lexical_brackets_nestage++; + break; + } break; + case LS_METHOD_CURLY: - if(c=='$') { - push_LS(PC); PC->ls=LS_VAR_NAME_SIMPLE; - result=c; - goto break2; - } - if(c=='^') { - push_LS(PC); PC->ls=LS_METHOD_NAME; - result=c; - goto break2; - } - if(c=='}') + switch(c) { + case '$': + push_LS(PC, LS_VAR_NAME_SIMPLE); + RC; + case '^': + push_LS(PC, LS_METHOD_NAME); + RC; + case '}': if(--lexical_brackets_nestage==0) { PC->ls=LS_METHOD_AFTER; - result=c; - goto break2; + RC; } - if(c=='{') + break; + case '{': lexical_brackets_nestage++; + break; + } break; + case LS_METHOD_AFTER: - if(c=='(') {/* )( }( */ - PC->ls=LS_METHOD_ROUND; + if(c=='[') {/* )( }( */ + PC->ls=LS_METHOD_SQUARE; lexical_brackets_nestage=1; - result=c; - goto break2; + RC; } if(c=='{') {/* ){ }{ */ PC->ls=LS_METHOD_CURLY; lexical_brackets_nestage=1; - result=c; - goto break2; + RC; } pop_LS(PC); - PC->source--; PC->col--; - result=END_OF_NAME; + PC->source--; if(--PC->col<0) { PC->line--; PC->col=-1; } + result=EON; goto break2; } - if (c == 0) { + if(c==0) { result=-1; - PC->source--; PC->col--; break; } } break2: - if(PC->source-1<=start) + if(begin==end) return result; else { PC->pending_state=result; - /* append last piece */ - PC->string->APPEND(start, PC->source-start-1, PC->file, start_line/*, start_col*/); - /* create STRING value: array of OP_STRING+string */ - *lvalp=L(PC->string); - /* new pieces storage */ - PC->string=new(*PC->pool) String(*PC->pool); - /* go */ + // strip last \n before LS_DEF_NAME or EOF + if((c=='@' || c==0) && end[-1]=='\n') + end--; + if(end!=begin) { + // append last piece + PC->string->APPEND(begin, end-begin, PC->file, begin_line/*, start_col*/); + } + // create STRING value: array of OP_VALUE+vstring + *lvalp=SL(NEW VString(*PC->string)); + // new pieces storage + PC->string=NEW String(POOL); + // go! return STRING; } } -int real_yyerror (parse_control *pc, char *s) /* Called by yyparse on error */ +int real_yyerror(parse_control *pc, char *s) /* Called by yyparse on error */ { - fprintf (stderr, "[%s]\n", s); + //fprintf(stderr, "[%s]\n", s); - s[MAX_STRING-1]=0; strcpy(pc->error, s); + strncpy(pc->error, s, MAX_STRING); // TODO: перепроверить с треклятым последним байтом return 1; } static void - yyprint ( + yyprint( FILE *file, int type, YYSTYPE value) { - if (type == STRING) - fprintf (file, " \"%s\"", LA2S(value)->cstr()); + if(type==STRING) + fprintf(file, " \"%s\"", SLA2S(value)->cstr()); }