--- parser3/src/main/compile.y 2001/03/08 13:13:40 1.76 +++ parser3/src/main/compile.y 2001/03/19 17:42:14 1.106 @@ -1,13 +1,30 @@ -/* - $Id: compile.y,v 1.76 2001/03/08 13:13:40 paf Exp $ +/** @file + Parser: compiler(lexical parser and grammar). + + Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) + + Author: Alexander Petrosyan (http://design.ru/paf) + + $Id: compile.y,v 1.106 2001/03/19 17:42:14 paf Exp $ +*/ + +/** + @todo parser4: + - cache compiled code from request to request. to do that... + -#: make method definitions, @CLASS, @BASE, @USE instructions, + which would be executed afterwards, and actions + now performed at compile time would be delayed to run time. + -#: make cache expiration on time and on disk-change of class source + -#: in apache use subpools for compiled class storage + -#: in iis make up specialized Pool object for that */ %{ -#define YYSTYPE Array/**/ * +#define YYSTYPE Array/**/ * #define YYPARSE_PARAM pc #define YYLEX_PARAM pc #define YYDEBUG 1 -#define YYERROR_VERBOSE +#define YYERROR_VERBOSE 1 #define yyerror(msg) real_yyerror((parse_control *)pc, msg) #define YYPRINT(file, type, value) yyprint(file, type, value) @@ -20,9 +37,10 @@ #include "pa_request.h" #include "pa_vobject.h" #include "pa_vdouble.h" +#include "pa_globals.h" -#define SELF_NAME "self" -#define USE_NAME "USE" +#define SELF_ELEMENT_NAME "self" +#define USE_CONTROL_METHOD_NAME "USE" int real_yyerror(parse_control *pc, char *s); static void yyprint(FILE *file, int type, YYSTYPE value); @@ -34,6 +52,7 @@ int yylex(YYSTYPE *lvalp, void *pc); #define POOL *PC->pool #undef NEW #define NEW new(POOL) +#ifndef DOXYGEN_SHOULD_SKIP_THIS %} %pure_parser @@ -63,8 +82,10 @@ int yylex(YYSTYPE *lvalp, void *pc); %token DEF "def" %token IN "in" %token FEXISTS "-f" +%token IS "is" /* logical */ +%left "is" %left "lt" "gt" "le" "ge" %left "eq" "ne" %left '<' '>' "<=" ">=" "##" @@ -85,17 +106,14 @@ int yylex(YYSTYPE *lvalp, void *pc); %left NEG /* negation: unary - */ %% - -all: /* TODO: у ^execute непременно задать какой-то name, см. 'RUN' */ +all: one_big_piece { - String& MAIN=*NEW String(POOL); - MAIN.APPEND_CONST(MAIN_METHOD_NAME); Method& method=*NEW Method(POOL, - MAIN, - 0, /*numbered_params_count*/ + *main_method_name, + 0, 0, /*min, max numbered_params_count*/ 0/*param_names*/, 0/*local_names*/, $1/*parser_code*/, 0/*native_code*/); - PC->vclass->add_method(MAIN, method); + PC->cclass->add_method(*main_method_name, method); } | methods; @@ -106,7 +124,7 @@ method: control_method | code_method; control_method: '@' STRING '\n' control_strings { - String& command=*SLA2S($2); + const String& command=*SLA2S($2); YYSTYPE strings_code=$4; if(strings_code->size()<1*2) { strcpy(PC->error, "@"); @@ -115,42 +133,43 @@ control_method: '@' STRING '\n' YYERROR; } if(command==CLASS_NAME) { - if(PC->vclass!=&PC->request->root_class) { // already changed from default? + if(PC->cclass!=&PC->request->ROOT) { // already changed from default? strcpy(PC->error, "class already have a name '"); - strncat(PC->error, PC->vclass->name().cstr(), 100); + strncat(PC->error, PC->cclass->name().cstr(), 100); strcat(PC->error, "'"); YYERROR; } if(strings_code->size()==1*2) { // new class' name - String *name=SLA2S(strings_code); + const String *name=SLA2S(strings_code); // creating the class - PC->vclass=NEW VClass(POOL); - PC->vclass->set_name(*name); + PC->cclass=NEW VClass(POOL); + PC->cclass->set_name(*name); // defaulting base. may change with @BASE - PC->vclass->set_base(PC->request->root_class); + PC->cclass->set_base(PC->request->ROOT); // append to request's classes - PC->request->classes_array()+=PC->vclass; - PC->request->classes().put(*name, PC->vclass); + PC->request->classes().put(*name, PC->cclass); } else { strcpy(PC->error, "@"CLASS_NAME" must contain sole name"); YYERROR; } } else { - if(command==USE_NAME) { + if(command==USE_CONTROL_METHOD_NAME) { for(int i=0; isize(); i+=2) { - String *file=SLA2S(strings_code, i); - file->APPEND_CONST(".p"); - PC->request->use(file->cstr(), 0); + String file(*SLA2S(strings_code, i)); + file.APPEND_CONST(".p"); + PC->request->use_file(file.cstr()); } } else if(command==BASE_NAME) { - if(PC->vclass->base()!=&PC->request->root_class) { // already changed from default? - strcpy(PC->error, "there must be only one @"BASE_NAME); + if(PC->cclass->base()!=&PC->request->ROOT) { // already changed from default? + strcpy(PC->error, "class already have a base '"); + strncat(PC->error, PC->cclass->base()->name().cstr(), 100); + strcat(PC->error, "'"); YYERROR; } if(strings_code->size()==1*2) { // TODO: преодолеть self и циклические base - String& base_name=*SLA2S(strings_code); + const String& base_name=*SLA2S(strings_code); VClass *base=static_cast( PC->request->classes().get(base_name)); if(!base) { @@ -158,15 +177,16 @@ control_method: '@' STRING '\n' strcat(PC->error, ": undefined class in @"BASE_NAME); YYERROR; } - PC->vclass->set_base(*base); + PC->cclass->set_base(*base); } else { strcpy(PC->error, "@"BASE_NAME" must contain sole name"); YYERROR; } } else { - strcpy(PC->error, command.cstr()); - strcat(PC->error, ": invalid special name. valid names are " - CLASS_NAME", "USE_NAME" and "BASE_NAME); + strcpy(PC->error, "'"); + strncat(PC->error, command.cstr(), MAX_STRING/2); + strcat(PC->error, "' invalid special name. valid names are " + "'"CLASS_NAME"', '"USE_CONTROL_METHOD_NAME"' and '"BASE_NAME"'"); YYERROR; } } @@ -197,10 +217,10 @@ code_method: '@' STRING bracketed_maybe_ Method& method=*NEW Method(POOL, *name, - 0/*numbered_params_count*/, + 0, 0/*min,max numbered_params_count*/, params_names, locals_names, $7, 0); - PC->vclass->add_method(*name, method); + PC->cclass->add_method(*name, method); }; maybe_bracketed_strings: empty | bracketed_maybe_strings; @@ -214,18 +234,15 @@ maybe_comment: empty | STRING; maybe_codes: empty | codes; -codes: code | codes code { - $$=$1; - P($$, $2); -}; -code: write_str_literal | action; +codes: code | codes code { $$=$1; P($$, $2) }; +code: write_string | action; action: get | put | with | call; /* get */ get: get_value { $$=$1; /* stack: resulting value */ - O($$, OP_WRITE); /* value=pop; wcontext.write(value) */ + O($$, OP_WRITE_VALUE); /* value=pop; wcontext.write(value) */ }; get_value: '$' get_name_value { $$=$2 } get_name_value: name_without_curly_rdive EON | name_in_curly_rdive; @@ -237,8 +254,8 @@ name_without_curly_rdive: name_without_curly_rdive_read: name_without_curly_rdive_code { $$=N(POOL); Array *diving_code=$1; - String *first_name=SLA2S(diving_code); - if(first_name && *first_name==SELF_NAME) { + const String *first_name=SLA2S(diving_code); + if(first_name && *first_name==SELF_ELEMENT_NAME) { O($$, OP_WITH_SELF); /* stack: starting context */ P($$, diving_code, /* skip over... */ @@ -259,10 +276,9 @@ name_without_curly_rdive_code: name_adva /* put */ -put: '$' name_expr_wdive constructor_value { +put: '$' name_expr_wdive construct { $$=$2; /* stack: context,name */ P($$, $3); /* stack: context,name,constructor_value */ - O($$, OP_CONSTRUCT); /* value=pop; name=pop; context=pop; construct(context,name,value) */ }; name_expr_wdive: name_expr_wdive_write @@ -271,8 +287,8 @@ name_expr_wdive: name_expr_wdive_write: name_expr_dive_code { $$=N(POOL); Array *diving_code=$1; - String *first_name=SLA2S(diving_code); - if(first_name && *first_name==SELF_NAME) { + const String *first_name=SLA2S(diving_code); + if(first_name && *first_name==SELF_ELEMENT_NAME) { O($$, OP_WITH_SELF); /* stack: starting context */ P($$, diving_code, /* skip over... */ @@ -290,9 +306,16 @@ name_expr_wdive_root: ':' name_expr_dive }; name_expr_wdive_class: class_prefix name_expr_dive_code { $$=$1; P($$, $2) }; -constructor_value: - '[' any_constructor_code_value ']' { $$=$2 } -| '(' any_expr ')' { $$=$2 } +construct: construct_by_code | construct_by_expr; +construct_by_code: '[' any_constructor_code_value ']' { + $$=$2; /* stack: context, name, value */ + O($$, OP_CONSTRUCT_VALUE); /* value=pop; name=pop; context=pop; construct(context,name,value) */ +} +; +construct_by_expr: '(' expr_value ')' { + $$=$2; /* stack: context, name, value */ + O($$, OP_CONSTRUCT_EXPR); /* value=pop; name=pop; context=pop; construct(context,name,value) */ +} ; any_constructor_code_value: empty_string_value /* optimized $var[] case */ @@ -312,7 +335,7 @@ codes__excluding_sole_str_literal: actio call: call_value { $$=$1; /* stack: value */ - O($$, OP_WRITE); /* value=pop; wcontext.write(value) */ + O($$, OP_WRITE_VALUE); /* value=pop; wcontext.write(value) */ }; call_value: '^' call_name store_params EON { /* ^field.$method{vasya} */ $$=$2; /* with_xxx,diving code; stack: context,method_junction */ @@ -331,10 +354,7 @@ store_param: ; store_square_param: '[' store_code_param_parts ']' {$$=$2}; store_round_param: '(' store_expr_param_parts ')' {$$=$2}; -store_curly_param: '{' maybe_codes '}' { - $$=N(POOL); - PCA($$, $2); -}; +store_curly_param: '{' store_curly_param_parts '}' {$$=$2}; store_code_param_parts: store_code_param_part | store_code_param_parts ';' store_code_param_part { $$=$1; P($$, $3) } @@ -343,23 +363,32 @@ store_expr_param_parts: store_expr_param_part | store_expr_param_parts ';' store_expr_param_part { $$=$1; P($$, $3) } ; +store_curly_param_parts: + store_curly_param_part +| store_curly_param_parts ';' store_curly_param_part { $$=$1; P($$, $3) } +; store_code_param_part: - empty /* optimized () case */ -| STRING { /* optimized (STRING) case */ + empty /* optimized [] case */ +| STRING { /* optimized [STRING] case */ $$=$1; O($$, OP_STORE_PARAM); } -| constructor_code_value { /* (something complex) */ +| constructor_code_value { /* [something complex] */ $$=$1; + O($$, OP_STORE_PARAM); } ; store_expr_param_part: write_expr_value { $$=N(POOL); + PEA($$, $1); +}; +store_curly_param_part: maybe_codes { + $$=N(POOL); PCA($$, $1); }; -write_expr_value: any_expr { +write_expr_value: expr_value { $$=$1; - O($$, OP_WRITE); + O($$, OP_WRITE_EXPR_RESULT); }; /* name */ @@ -393,7 +422,7 @@ name_expr_with_subvar_value: STRING subv $$=N(POOL); O($$, OP_CREATE_EWPOOL); P($$, $1); - O($$, OP_WRITE); + O($$, OP_WRITE_VALUE); P($$, $2); O($$, OP_REDUCE_EWPOOL); }; @@ -427,19 +456,14 @@ with: '$' name_without_curly_rdive '{' c O($$, OP_CREATE_RWPOOL); P($$, $4); O($$, OP_REDUCE_RWPOOL); - O($$, OP_WRITE); + O($$, OP_WRITE_VALUE); }; /* expr */ -any_expr: - empty_double_value /* optimized $var() case */ -| optimized_expr /* $var(something) */ -; -optimized_expr: expr { - if(($$=$1)->size()==2) { // only one string literal in there? +expr_value: expr { + if(($$=$1)->size()==2) // only one string literal in there? change_string_literal_to_double_literal($$); // make that string literal Double - } }; expr: STRING @@ -478,6 +502,7 @@ expr: | expr "ge" expr { $$=$1; P($$, $3); O($$, OP_STR_GE) } | expr "eq" expr { $$=$1; P($$, $3); O($$, OP_STR_EQ) } | expr "ne" expr { $$=$1; P($$, $3); O($$, OP_STR_NE) } +| expr "is" expr { $$=$1; P($$, $3); O($$, OP_IS) } ; string_inside_quotes_value: maybe_codes { @@ -489,16 +514,16 @@ string_inside_quotes_value: maybe_codes /* basics */ -write_str_literal: STRING { - $$=$1; - O($$, OP_WRITE); +write_string: STRING { + // optimized from OP_STRING+OP_WRITE_VALUE to OP_STRING__WRITE + change_string_literal_to_write_string_literal($$=$1) }; -empty_double_value: /* empty */ { $$=VL(NEW VDouble(POOL)) }; empty_string_value: /* empty */ { $$=VL(NEW VString(POOL)) }; empty: /* empty */ { $$=N(POOL) }; %% +#endif /* 000$111(2222)00 @@ -529,8 +554,8 @@ int yylex(YYSTYPE *lvalp, void *pc) { return result; } - char *begin=PC->source; - char *end; + const char *begin=PC->source; + const char *end; int begin_line=PC->line; int skip_analized=0; while(true) { @@ -728,10 +753,19 @@ int yylex(YYSTYPE *lvalp, void *pc) { break; case 'i': if(end==begin) // right after whitespace - if(PC->source[0]=='n') { // in - skip_analized=1; - result=IN; - goto break2; + switch(PC->source[0]) { + case 'n': + { // in + skip_analized=1; + result=IN; + goto break2; + } + case 's': + { // is + skip_analized=1; + result=IS; + goto break2; + } } break; case 'd': @@ -762,9 +796,7 @@ int yylex(YYSTYPE *lvalp, void *pc) { if(PC->ls==LS_EXPRESSION_VAR_NAME) { // name in expr ends also before binary operators switch(c) { - case '+': case '-': case '*': case '/': case '%': - case '&': case '|': - case '<': case '>': case '=': case '!': + case '-': pop_LS(PC); PC->source--; if(--PC->col<0) { PC->line--; PC->col=-1; } result=EON; @@ -776,6 +808,12 @@ int yylex(YYSTYPE *lvalp, void *pc) { case ' ': case '\t': case '\n': case ';': case ']': case '}': case ')': case '"': + case '<': case '>': // these stand for HTML brackets and expression binary ops + case '+': case '*': case '/': case '%': + case '&': case '|': + case '=': case '!': + // common delimiters + case '\'': case ',': pop_LS(PC); PC->source--; if(--PC->col<0) { PC->line--; PC->col=-1; } result=EON; @@ -910,6 +948,8 @@ int yylex(YYSTYPE *lvalp, void *pc) { case '^': push_LS(PC, LS_METHOD_NAME); RC; + case ';': // param delim + RC; case '}': if(--lexical_brackets_nestage==0) { PC->ls=LS_METHOD_AFTER; @@ -976,8 +1016,6 @@ break2: int real_yyerror(parse_control *pc, char *s) /* Called by yyparse on error */ { - //fprintf(stderr, "[%s]\n", s); - strncpy(pc->error, s, MAX_STRING); // TODO: перепроверить с треклятым последним байтом return 1; }