--- parser3/src/classes/op.C 2007/04/23 10:30:09 1.166 +++ parser3/src/classes/op.C 2016/11/01 23:10:40 1.243 @@ -1,12 +1,10 @@ /** @file Parser: parser @b operators. - Copyright (c) 2001-2005 ArtLebedev Group (http://www.artlebedev.com) + Copyright (c) 2001-2015 Art. Lebedev Studio (http://www.artlebedev.com) Author: Alexandr Petrosian (http://paf.design.ru) */ -static const char * const IDENT_OP_C="$Date: 2007/04/23 10:30:09 $"; - #include "classes.h" #include "pa_vmethod_frame.h" @@ -20,16 +18,11 @@ static const char * const IDENT_OP_C="$D #include "pa_vclass.h" #include "pa_charset.h" -// limits - -#define MAX_LOOPS 20000 +volatile const char * IDENT_OP_C="$Id: op.C,v 1.243 2016/11/01 23:10:40 moko Exp $"; // defines #define CASE_DEFAULT_VALUE "DEFAULT" -#define PROCESS_MAIN_OPTION_NAME "main" -#define PROCESS_FILE_OPTION_NAME "file" -#define PROCESS_LINENO_OPTION_NAME "lineno" // class @@ -38,15 +31,6 @@ public: VClassMAIN(); }; -// defines for globals - -#define CYCLE_DATA_NAME "CYCLE-DATA" - -// globals - -//^for & co -String cycle_data_name(CYCLE_DATA_NAME); - // defines for statics #define SWITCH_DATA_NAME "SWITCH-DATA" @@ -70,11 +54,11 @@ static const String exception_var_name(E // helpers -class Untaint_lang_name2enum: public Hash { +class Untaint_lang_name2enum: public HashString { public: Untaint_lang_name2enum() { - #define ULN(name, LANG) \ - put(String::Body(name), (value_type)(String::L_##LANG)); + #define ULN(name, LANG) put(name, (value_type)(String::L_##LANG)); + ULN("clean", CLEAN); ULN("as-is", AS_IS); ULN("optimized-as-is", AS_IS|String::L_OPTIMIZE_BIT); ULN("file-spec", FILE_SPEC); @@ -88,6 +72,8 @@ public: ULN("html", HTML); ULN("optimized-html", HTML|String::L_OPTIMIZE_BIT); ULN("regex", REGEX); + ULN("parser-code", PARSER_CODE); + ULN("json", JSON); #undef ULN } } untaint_lang_name2enum; @@ -95,59 +81,68 @@ public: // methods static void _if(Request& r, MethodParams& params) { - bool condition=params.as_bool(0, "condition must be expression", r); - if(condition) - r.write_pass_lang(r.process(*params.get(1))); - else if(params.count()>2) - r.write_pass_lang(r.process(*params.get(2))); + size_t max_param=params.count()-1; + size_t i=0; + do { + bool condition=params.as_bool(i, "condition must be expression", r); + if(condition) { + r.process_write(params[i+1]); + return; + } + i+=2; + } while (i < max_param); + + if(i == max_param) + r.process_write(params[i]); } -static void _untaint(Request& r, MethodParams& params) { +String::Language get_untaint_lang(const String& lang_name){ + String::Language lang=untaint_lang_name2enum.get(lang_name); + if(!lang) + throw Exception(PARSER_RUNTIME, &lang_name, "invalid taint language"); + return lang; +} +static void _untaint(Request& r, MethodParams& params) { String::Language lang; if(params.count()==1) - lang=String::L_AS_IS; // mark as simply 'tainted'. useful in html from sql - else { - const String& lang_name=params.as_string(0, "lang must be string"); - lang=untaint_lang_name2enum.get(lang_name); - if(!lang) - throw Exception(0, - &lang_name, - "invalid taint language"); - } + lang=String::L_AS_IS; // mark as simply 'as-is'. useful in html from sql + else + lang=get_untaint_lang(params.as_string(0, "lang must be string")); - { - Value& vbody=params.as_junction(params.count()-1, "body must be code"); - - Temp_lang temp_lang(r, lang); // set temporarily specified ^untaint[language; - r.write_pass_lang(r.process(vbody)); // process marking tainted with that lang - } + Value& vbody=params.as_junction(params.count()-1, "body must be code"); + Value& result=r.process(vbody); + + if(const String* string=result.get_string()){ + String &untainted=*new String(); + string->append_to(untainted, lang); // mark all tainted to specified language + r.write(untainted); + } else + r.write(result); // this is not normal, just backward compatibility } static void _taint(Request& r, MethodParams& params) { String::Language lang; if(params.count()==1) - lang=String::L_TAINTED; // mark as simply 'tainted'. useful in table:set - else { - const String& lang_name=params.as_string(0, "lang must be string"); - lang=untaint_lang_name2enum.get(lang_name); - if(!lang) - throw Exception(0, - &lang_name, - "invalid taint language"); - } + lang=String::L_TAINTED; // mark as simply 'tainted'. useful in table:create + else + lang=get_untaint_lang(params.as_string(0, "lang must be string")); { Value& vbody=params.as_no_junction(params.count()-1, "body must not be code"); - String result; - result.append( - vbody.as_string(), // process marking tainted with that lang - lang, true); // force result language to specified - r.write_pass_lang(result); + String result(vbody.as_string(), lang); // force result language to specified + r.write(result); } } +static void _apply_taint(Request& r, MethodParams& params) { + String::Language lang=params.count()==1 ? String::L_AS_IS : get_untaint_lang(params.as_string(0, "lang must be string")); + const String &sbody=params.as_string(params.count()-1, "body must be string"); + String::Body result_body=sbody.cstr_to_string_body_untaint(lang, r.connection(false), &r.charsets); + r.write(*new String(result_body, String::L_AS_IS)); +} + static void _process(Request& r, MethodParams& params) { Method* main_method; @@ -157,70 +152,63 @@ static void _process(Request& r, MethodP if(maybe_target_self.get_string() || maybe_target_self.get_junction()) target_self=&r.get_method_frame()->caller()->self(); else { - target_self=&maybe_target_self; index++; + target_self=&maybe_target_self; + if(params.count()==1) + throw Exception(PARSER_RUNTIME, 0, "no body specified"); + index++; } { - VStateless_class *target_class=target_self->get_last_derived_class(); + VStateless_class *target_class=target_self->get_class(); if(!target_class) - throw Exception(PARSER_RUNTIME, - 0, - "no target class"); + throw Exception(PARSER_RUNTIME, 0, "no target class"); - // temporary remove language change - Temp_lang temp_lang(r, String::L_PASS_APPENDED); // temporary zero @main so to maybe-replace it in processed code Temp_method temp_method_main(*target_class, main_method_name, 0); - // temporary zero @auto so it wouldn't be auto-called in Request::use_buf - Temp_method temp_method_auto(*target_class, auto_method_name, 0); - - size_t options_index=index+1; - HashStringValue* options=0; - if(options_indexget(PROCESS_MAIN_OPTION_NAME)) { - valid_options++; - main_alias=&vmain_alias->as_string(); - } - if(Value* vfile_alias=options->get(PROCESS_FILE_OPTION_NAME)) { - valid_options++; - file_alias=&vfile_alias->as_string(); - } - if(Value* vline_no_alias_offset=options->get(PROCESS_LINENO_OPTION_NAME)) { - valid_options++; - line_no_alias_offset=vline_no_alias_offset->as_int(); + bool allow_class_replace=false; + + size_t options_index=index+1; + if(options_indexas_string(); + } else if(key == "file") { + valid_options++; + file_alias=&value->as_string(); + } else if(key == "lineno") { + valid_options++; + line_no_alias_offset=value->as_int(); + } else if(key == "replace") { + valid_options++; + allow_class_replace=r.process(*value).as_bool(); + } + } + + if(valid_options!=options->count()) + throw Exception(PARSER_RUNTIME, 0, CALLED_WITH_INVALID_OPTION); } - - if(valid_options!=options->count()) - throw Exception(PARSER_RUNTIME, - 0, - "called with invalid option"); - } - uint processe_file_no=file_alias? - r.register_file(r.absolute(*file_alias)) - : pseudo_file_no__process; + uint processe_file_no=file_alias ? r.register_file(r.absolute(*file_alias)) : pseudo_file_no__process; // process...{string} Value& vjunction=params.as_junction(index, "body must be code"); // evaluate source to process const String& source=r.process_to_string(vjunction); - r.use_buf(*target_class, - source.cstr(String::L_UNSPECIFIED, r.connection(false)), - main_alias, - processe_file_no, - line_no_alias_offset); + + Temp_class_replace class_replace(r, allow_class_replace); + + r.use_buf(*target_class, source.untaint_cstr(String::L_PARSER_CODE, r.connection(false)), main_alias, processe_file_no, line_no_alias_offset); // main_method main_method=target_class->get_method(main_method_name); @@ -228,10 +216,10 @@ static void _process(Request& r, MethodP // after restoring current-request-lang // maybe-execute @main[] if(main_method) { - // temporarily set method_frame's self to target_self - Temp_method_frame_self tmfs(*r.get_method_frame(), *target_self); - // execute! - r.execute(*main_method->parser_code); + VMethodFrame frame(*main_method, r.get_method_frame()->caller(), *target_self); + frame.empty_params(); + r.call(frame); + r.write(frame.result()); } } @@ -240,152 +228,186 @@ static void _rem(Request&, MethodParams& } static void _while(Request& r, MethodParams& params) { - Temp_hash_value - cycle_data_setter(r.classes_conf, cycle_data_name, /*any not null flag*/&r); + InCycle temp(r); + + Value& vcondition=params.as_expression(0, "condition must be number, bool or expression"); - Value& vcondition=params.as_junction(0, "condition must be expression"); Value& body_code=params.as_junction(1, "body must be code"); Value* delim_maybe_code=params.count()>2?¶ms[2]:0; // while... int endless_loop_count=0; - bool need_delim=false; - while(true) { - if(++endless_loop_count>=MAX_LOOPS) // endless loop? - throw Exception(PARSER_RUNTIME, - 0, - "endless loop detected"); - - bool condition=r.process_to_value(vcondition, - false/*don't intercept string*/).as_bool(); - if(!condition) // ...condition is true - break; + if(delim_maybe_code){ // delimiter set + bool need_delim=false; + while(true) { + if(++endless_loop_count>=pa_loop_limit) // endless loop? + throw Exception(PARSER_RUNTIME, 0, "endless loop detected"); + + if(!r.process(vcondition).as_bool()) + break; + + Value& sv_processed=r.process(body_code); + Request::Skip lskip=r.get_skip(); r.set_skip(Request::SKIP_NOTHING); + + const String* s_processed=sv_processed.get_string(); + if(s_processed && !s_processed->is_empty()) { // we have body + if(need_delim) // need delim & iteration produced string? + r.write(r.process(*delim_maybe_code)); + else + need_delim=true; + } + r.write(sv_processed); - StringOrValue sv_processed=r.process(body_code); - Request::Skip lskip=r.get_skip(); r.set_skip(Request::SKIP_NOTHING); - const String* s_processed=sv_processed.get_string(); - if(delim_maybe_code && s_processed && s_processed->length()) { // delimiter set and we have body - if(need_delim) // need delim & iteration produced string? - r.write_pass_lang(r.process(*delim_maybe_code)); - need_delim=true; + if(lskip==Request::SKIP_BREAK) + break; } - r.write_pass_lang(sv_processed); + } else { + while(true) { + if(++endless_loop_count>=pa_loop_limit) // endless loop? + throw Exception(PARSER_RUNTIME, 0, "endless loop detected"); - if(lskip==Request::SKIP_BREAK) - break; + if(!r.process(vcondition).as_bool()) + break; + + r.process_write(body_code); + Request::Skip lskip=r.get_skip(); r.set_skip(Request::SKIP_NOTHING); + + if(lskip==Request::SKIP_BREAK) + break; + } } } static void _use(Request& r, MethodParams& params) { - Value& vfile=params.as_no_junction(0, "file name must not be code"); - r.use_file(r.main_class, vfile.as_string()); + Value& vfile=params.as_no_junction(0, FILE_NAME_MUST_NOT_BE_CODE); + + bool allow_class_replace=false; + + if(params.count()==2) + if(HashStringValue* options=params.as_hash(1)) { + int valid_options=0; + for(HashStringValue::Iterator i(*options); i; i.next() ){ + + String::Body key=i.key(); + Value* value=i.value(); + + if(key == "replace") { + valid_options++; + allow_class_replace=r.process(*value).as_bool(); + } + + if(valid_options!=options->count()) + throw Exception(PARSER_RUNTIME, 0, CALLED_WITH_INVALID_OPTION); + } + } + + Temp_class_replace class_replace(r, allow_class_replace); + + // _use could be called from the parser3 method only, so caller is always defined + r.use_file(r.main_class, vfile.as_string(), r.get_method_filename(&r.get_method_frame()->caller()->method)); } static void set_skip(Request& r, Request::Skip askip) { - void* data=r.classes_conf.get(cycle_data_name); - if(!data) - throw Exception(PARSER_RUNTIME, - 0, - "without cycle"); - + if(!r.get_in_cycle()) + throw Exception(askip==Request::SKIP_BREAK ? "parser.break" : "parser.continue", 0, "without cycle"); r.set_skip(askip); } -static void _break(Request& r, MethodParams&) { - set_skip(r, Request::SKIP_BREAK); +static void _break(Request& r, MethodParams& params) { + if(!params.count() || params.as_bool(0, "condition must be expression", r)) set_skip(r, Request::SKIP_BREAK); } -static void _continue(Request& r, MethodParams&) { - set_skip(r, Request::SKIP_CONTINUE); +static void _continue(Request& r, MethodParams& params) { + if(!params.count() || params.as_bool(0, "condition must be expression", r)) set_skip(r, Request::SKIP_CONTINUE); } static void _for(Request& r, MethodParams& params) { - Temp_hash_value - cycle_data_setter(r.classes_conf, cycle_data_name, /*any not null flag*/&r); + InCycle temp(r); const String& var_name=params.as_string(0, "var name must be string"); int from=params.as_int(1, "from must be int", r); int to=params.as_int(2, "to must be int", r); - Value& body_code=params.as_junction(3, "body must be code"); + Value& body_code=params.as_junction(3, "body must be code"); Value* delim_maybe_code=params.count()>4?¶ms[4]:0; - if(to-from>=MAX_LOOPS) // too long loop? - throw Exception(PARSER_RUNTIME, - 0, - "endless loop detected"); + if(to-from>=pa_loop_limit) // too long loop? + throw Exception(PARSER_RUNTIME, 0, "endless loop detected"); - bool need_delim=false; VInt* vint=new VInt(0); VMethodFrame& caller=*r.get_method_frame()->caller(); - caller.put_element(caller, var_name, vint, false); - for(int i=from; i<=to; i++) { - vint->set_int(i); - - StringOrValue sv_processed=r.process(body_code); - Request::Skip lskip=r.get_skip(); r.set_skip(Request::SKIP_NOTHING); - const String* s_processed=sv_processed.get_string(); - if(delim_maybe_code && s_processed && s_processed->length()) { // delimiter set and we have body - if(need_delim) // need delim & iteration produced string? - r.write_pass_lang(r.process(*delim_maybe_code)); - need_delim=true; + r.put_element(caller, var_name, vint); + if(delim_maybe_code){ // delimiter set + bool need_delim=false; + + for(int i=from; i<=to; i++) { + vint->set_int(i); + + Value& sv_processed=r.process(body_code); + Request::Skip lskip=r.get_skip(); r.set_skip(Request::SKIP_NOTHING); + + const String* s_processed=sv_processed.get_string(); + if(s_processed && !s_processed->is_empty()) { // we have body + if(need_delim) // need delim & iteration produced string? + r.write(r.process(*delim_maybe_code)); + else + need_delim=true; + } + r.write(sv_processed); + + if(lskip==Request::SKIP_BREAK) + break; } - r.write_pass_lang(sv_processed); + } else { + for(int i=from; i<=to; i++) { + vint->set_int(i); + + r.process_write(body_code); + Request::Skip lskip=r.get_skip(); r.set_skip(Request::SKIP_NOTHING); - if(lskip==Request::SKIP_BREAK) - break; + if(lskip==Request::SKIP_BREAK) + break; + } } } static void _eval(Request& r, MethodParams& params) { Value& expr=params.as_junction(0, "need expression"); // evaluate expresion - Value& value_result=r.process_to_value(expr, - false/*don't intercept string*/).as_expr_result(); + Value& value_result=r.process(expr).as_expr_result(); if(params.count()>1) { - Value& fmt=params.as_no_junction(1, "fmt must not be code"); - r.write_no_lang(String(format(value_result.as_double(), fmt.as_string().cstrm()))); + const String& fmt=params.as_string(1, "fmt must be string").trim(); + if(fmt.is_empty()){ + r.write(value_result); + } else { + r.write(String(format(value_result.as_double(), fmt.cstrm()))); + } } else - r.write_no_lang(value_result); + r.write(value_result); } static void _connect(Request& r, MethodParams& params) { -#ifdef RESOURCES_DEBUG -struct timeval mt[2]; -#endif Value& url=params.as_no_junction(0, "url must not be code"); Value& body_code=params.as_junction(1, "body must be code"); Table* protocol2driver_and_client=0; - if(Value* sql=r.main_class.get_element(String(MAIN_SQL_NAME), r.main_class, false)) { - if(Value* element=sql->get_element(String(MAIN_SQL_DRIVERS_NAME), *sql, false)) { + if(Value* sql=r.main_class.get_element(String(MAIN_SQL_NAME))) { + if(Value* element=sql->get_element(String(MAIN_SQL_DRIVERS_NAME))) { protocol2driver_and_client=element->get_table(); } } -#ifdef RESOURCES_DEBUG -//measure:before -gettimeofday(&mt[0],NULL); -#endif // connect SQL_Connection* connection=SQL_driver_manager->get_connection(url.as_string(), protocol2driver_and_client, - r.charsets.source().NAME().cstr()); + r.charsets.source().NAME().cstr(), + r.request_info.document_root); -#ifdef RESOURCES_DEBUG -//measure:after connect -gettimeofday(&mt[1],NULL); - -double t[2]; -for(int i=0;i<2;i++) - t[i]=mt[i].tv_sec+mt[i].tv_usec/1000000.0; - -r.sql_connect_time+=t[1]-t[0]; -#endif Temp_connection temp_connection(r, connection); + // execute body try { - r.write_assign_lang(r.process(body_code)); + r.process_write(body_code); connection->commit(); connection->close(); } catch(...) { // process problem @@ -399,25 +421,37 @@ r.sql_connect_time+=t[1]-t[0]; class Switch_data: public PA_Object { public: Request& r; - Value& searching; + const String* searching_string; + double searching_double; + bool searching_bool; Value* found; Value* _default; public: Switch_data(Request& ar, Value& asearching): - r(ar), searching(asearching) {} + r(ar) + { + if(asearching.is_string() || asearching.is_void()){ + searching_string=&asearching.as_string(); + searching_double=0; + searching_bool=false; + } else { + searching_string=0; + searching_double=asearching.as_double(); + searching_bool=asearching.is_bool(); + } + } }; #endif static void _switch(Request& r, MethodParams& params) { - Switch_data* data=new Switch_data(r, r.process_to_value(params[0])); - Temp_hash_value - switch_data_setter(r.classes_conf, switch_data_name, data); + Switch_data* data=new Switch_data(r, r.process(params[0])); + Temp_hash_value, void*> switch_data_setter(&r.classes_conf, switch_data_name, data); Value& cases_code=params.as_junction(1, "switch cases must be code"); // execution of found ^case[...]{code} must be in context of ^switch[...]{code} // because of stacked WWrapper used there as wcontext - r.process(cases_code, true/*intercept_string*/); + r.process(cases_code); if(Value* selected_code=data->found? data->found: data->_default) - r.write_pass_lang(r.process(*selected_code)); + r.write(r.process(*selected_code)); } static void _case(Request& r, MethodParams& params) { @@ -427,52 +461,71 @@ static void _case(Request& r, MethodPara 0, "without switch"); + if(data->found) // matches already was found + return; + int count=params.count(); - Value& code=params.as_junction(--count, "case result must be code"); + Value* code=¶ms.as_expression(--count, "case result must be code"); + +#ifdef USE_DESTRUCTORS + Junction *j=code->get_junction(); + if (j){ + code=new VJunction(j->self,j->method,j->method_frame,j->rcontext,j->wcontext,j->code); + if (j->wcontext) j->wcontext->attach_junction((VJunction *)code); + } +#endif - Value& searching=data->searching; - bool we_are_searching_string_or_void=searching.is_string() || searching.is_void(); - for(int i=0; i_default=&code; - break; + if(value.is_string() && value.as_string() == CASE_DEFAULT_VALUE){ + data->_default=code; + continue; } bool matches; - if(we_are_searching_string_or_void) - matches=searching.as_string() == value.as_string(); + if(data->searching_string) + matches=(*data->searching_string) == value.as_string(); + else if(data->searching_bool || value.is_bool()) + matches=(data->searching_double != 0) == value.as_bool(); else - matches=searching.as_double() == value.as_double(); - - if(matches) { - if(data->found) - throw Exception(PARSER_RUNTIME, - 0, - "duplicate found"); + matches=data->searching_double == value.as_double(); - data->found=&code; + if(matches){ + data->found=code; break; } } } #ifndef DOXYGEN struct Try_catch_result { - StringOrValue processed_code; + ValueRef processed_code; const String* exception_should_be_handled; Try_catch_result(): exception_should_be_handled(0) {} }; + +/// Auto-object used for temporary changing Request::skip. +class Temp_skip { + Request& frequest; + Request::Skip saved_skip; +public: + Temp_skip(Request& arequest) : frequest(arequest), saved_skip(arequest.get_skip()) { + arequest.set_skip(Request::SKIP_NOTHING); + } + ~Temp_skip() { + if(frequest.get_skip() == Request::SKIP_NOTHING) + frequest.set_skip(saved_skip); + } +}; #endif /// used by ^try and ^cache, @returns $exception.handled[string] if any template -static Try_catch_result try_catch(Request& r, - StringOrValue body_code(Request&, I), I info, - Value* catch_code, bool could_be_handled_by_caller=false) -{ +static Try_catch_result try_catch(Request& r, Value& body_code(Request&, I), I info, Value* catch_code, bool could_be_handled_by_caller=false) { Try_catch_result result; + + // minor bug: context not restored if only finally code is present, see #1062 if(!catch_code) { result.processed_code=body_code(r, info); return result; @@ -483,42 +536,44 @@ static Try_catch_result try_catch(Reques try { result.processed_code=body_code(r, info); } catch(const Exception& e) { - Request_context_saver throw_context(r); // taking snapshot of throw-context [stack trace contains error] + Request_context_saver throw_context(r); // remembering exception stack trace + Request::Exception_details details=r.get_details(e); - try_context.restore(); // restoring try-context to perform catch-code - Junction* junction=catch_code->get_junction(); - Value* method_frame=junction->method_frame; - Value* saved_exception_var_value=method_frame->get_element(exception_var_name, *method_frame, false); - VMethodFrame& frame=*junction->method_frame; - frame.put_element(frame, exception_var_name, &details.vhash, false); - result.processed_code=r.process(*catch_code); + try_context.restore(); // restoring try-context for code after try and catch-code + + { + Temp_value_element temp(r, *catch_code->get_junction()->method_frame, exception_var_name, &details.vhash); + Temp_skip temp_skip(r); + result.processed_code=r.process(*catch_code); + } - // retriving $exception.handled, restoring $exception var + // retriving $exception.handled Value* vhandled=details.vhash.hash().get(exception_handled_part_name); - frame.put_element(frame, exception_var_name, saved_exception_var_value, false); bool bhandled=false; if(vhandled) { if(vhandled->is_string()) { // not simple $exception.handled(1/0)? - if(could_be_handled_by_caller) { // and we can possibly handle it + if(bhandled=could_be_handled_by_caller) { // and we can possibly handle it result.exception_should_be_handled=vhandled->get_string(); // considering 'recovered' and let the caller recover - return result; } - - bhandled=false; } else - bhandled=vhandled->as_bool(); + bhandled=vhandled->as_bool(); } - if(!bhandled) { - throw_context.restore(); // restoring throw-context [exception were not handled] + if(!bhandled){ + throw_context.restore(); // restoring exception stack trace creared by try_context.restore() rethrow; } } + return result; } +static Value& process_try_body_code(Request& r, Value* body_code) { + return r.process(*body_code); +} + // cache-- // consts @@ -535,7 +590,7 @@ struct Data_string_serialized_prolog { #endif void cache_delete(const String& file_spec) { - file_delete(file_spec, false/*fail_on_read_problem*/); + file_delete(file_spec, false/*fail_on_problem*/); } #ifndef DOXYGEN @@ -547,15 +602,16 @@ public: struct Locked_process_and_cache_put_action_info { Request *r; Cache_scope *scope; - Value* body_code; Value* catch_code; + Value* body_code; + Value* catch_code; const String* processed_code; }; #endif -static StringOrValue process_cache_body_code(Request& r, Value* body_code) { - return StringOrValue(r.process_to_string(*body_code)); +static Value& process_cache_body_code(Request& r, Value* body_code) { + return r.process(*body_code); } /* @todo maybe network order worth spending some effort? @@ -566,7 +622,6 @@ static void locked_process_and_cache_put Locked_process_and_cache_put_action_info& info= *static_cast(context); - const String* body_from_disk=info.scope->body_from_disk; // body->process Try_catch_result result=try_catch(*info.r, @@ -580,10 +635,10 @@ static void locked_process_and_cache_put } else throw Exception(PARSER_RUNTIME, result.exception_should_be_handled, - "$"EXCEPTION_VAR_NAME"."EXCEPTION_HANDLED_PART_NAME" value must be " - "either boolean or string '"CACHE_EXCEPTION_HANDLED_CACHE_NAME"'"); + "$" EXCEPTION_VAR_NAME "." EXCEPTION_HANDLED_PART_NAME " value must be " + "either boolean or string '" CACHE_EXCEPTION_HANDLED_CACHE_NAME "'"); } else - info.processed_code=&result.processed_code.as_string(); + info.processed_code=&((Value &)result.processed_code).as_string(); // expiration time not spoiled by ^cache(0) or something? if(info.scope->expires > time(0)) { @@ -610,22 +665,27 @@ const String* locked_process_and_cache_p const String* result=file_write_action_under_lock( file_spec, - "cache_put", locked_process_and_cache_put_action, &info, + "cache_put", + locked_process_and_cache_put_action, + &info, false/*as_text*/, false/*do_append*/, - false/*block*/, - false/*fail on lock problem*/) ? info.processed_code: 0; + false/*block == don't wait till other thread release lock*/, + false/*dun throw exception if lock failed*/) ? info.processed_code: 0; + time_t now=time(0); if(scope.expires<=now) cache_delete(file_spec); return result; } + #ifndef DOXYGEN struct Cache_get_result { const String* body; bool expired; }; #endif + static Cache_get_result cache_get(Request_charsets& charsets, const String& file_spec, time_t now) { Cache_get_result result={0, false}; @@ -655,33 +715,32 @@ static Cache_get_result cache_get(Reques static time_t as_expires(Request& r, MethodParams& params, int index, time_t now) { time_t result; - if(Value* vdate=params[index].as(VDATE_TYPE, false)) - result=static_cast(vdate)->get_time(); + if(Value* vdate=params[index].as(VDATE_TYPE)) + result=(time_t)(static_cast(vdate)->get_time()); else result=now+(time_t)params.as_double(index, "lifespan must be date or number", r); return result; } + static const String& as_file_spec(Request& r, MethodParams& params, int index) { return r.absolute(params.as_string(index, "filespec must be string")); } + static void _cache(Request& r, MethodParams& params) { - if(params.count()==0) - { - // return current expiration time + if(params.count()==0) { + // ^cache[] -- return current expiration time Cache_scope* scope=static_cast(r.classes_conf.get(cache_data_name)); if(!scope) - throw Exception(PARSER_RUNTIME, - 0, - "expire-time get without cache"); - r.write_no_lang(*new VDate(scope->expires)); + throw Exception(PARSER_RUNTIME, 0, "expire-time get without cache"); + r.write(*new VDate((pa_time_t)scope->expires)); return; } time_t now=time(0); - // ^cache[filename] ^cache(seconds) ^cache[expires date] if(params.count()==1) { + // ^cache[filename] ^cache(seconds) ^cache[expires date] if(params[0].is_string()) { // filename? cache_delete(as_file_spec(r, params, 0)); return; @@ -705,98 +764,94 @@ static void _cache(Request& r, MethodPar "invalid number of parameters"); // file_spec, expires, body code - const String& file_spec=r.absolute(params.as_string(0, "filespec must be string")); + const String& file_spec=as_file_spec(r, params, 0); Cache_scope scope={as_expires(r, params, 1, now), 0}; - Temp_hash_value - cache_scope_setter(r.classes_conf, cache_data_name, &scope); + Temp_hash_value, void*> cache_scope_setter(&r.classes_conf, cache_data_name, &scope); Value& body_code=params.as_junction(2, "body_code must be code"); Value* catch_code=0; if(params.count()>3) catch_code=¶ms.as_junction(3, "catch_code must be code"); - if(scope.expires>now) { // valid 'expires' specified? try cached copy... - // hence we don't hope to have unary create/lockEX - // we need some plan to live in a life like that, so... - // worst races plan: - // A B - // open - // |open - // lockSH - // |nonblocking-lockEX fails - // unlockSH - // close, cache_get returns 0 - // open - // nonblocking-lockEX succeeds; process, write, close - // |retry1: open - // ... - // |lockSH succeeds; ... - - for(int retry=0; retry<2; retry++) { - Cache_get_result cached=cache_get(r.charsets, file_spec, now); - if(cached.body) { // have cached copy - if(cached.expired) - scope.body_from_disk=cached.body; // storing for user to retrive it with ^cache[] - else // and it's not expired yet - { - // write it out - r.write_assign_lang(*cached.body); - // happy with it - return; - } - } + if(scope.expires>now) { + Cache_get_result cached=cache_get(r.charsets, file_spec, now); - // non-blocked lock; process; cache it - if(const String* processed_body= - locked_process_and_cache_put(r, body_code, catch_code, scope, file_spec)) { - // write it out - r.write_assign_lang(*processed_body); - // happy with it - return; - } else { // somebody writing result right now - pa_sleep(0, 500000); // waiting half a second - retry=0; // prolonging our wait, than could cache_get it, without processing body_code - } - } - throw Exception(0, - &file_spec, - "locking problem"); + if(cached.body) { // have cached copy + if(cached.expired) { + scope.body_from_disk=cached.body; // storing for user to retrive it with ^cache[] + } else { + // and it's not expired yet write it out + r.write(*cached.body); + // happy with it + return; + } + } + + // no cached info or it's already expired + + // trying to process it under lock and store result in file + const String* processed_body=locked_process_and_cache_put(r, body_code, catch_code, scope, file_spec); + if(processed_body){ + // write it out + r.write(*processed_body); + // happy with it + return; + } else { + // we fail while get exclusive lock. nvm, we just execute body_code a bit later + } } else { // instructed not to cache; forget cached copy cache_delete(file_spec); - // process - const String& processed_body=r.process_to_string(body_code); - // write it out - r.write_assign_lang(processed_body); - // happy with it - return; } - // never reached + + // process without caching + if(catch_code){ + Try_catch_result result=try_catch(r, process_try_body_code, &body_code, catch_code); + r.write(result.processed_code); + } else { + r.write(r.process_to_string(body_code)); + } } -static StringOrValue process_try_body_code(Request& r, Value* body_code) { - return r.process(*body_code); -} static void _try_operator(Request& r, MethodParams& params) { Value& body_code=params.as_junction(0, "body_code must be code"); Value& catch_code=params.as_junction(1, "catch_code must be code"); + Value* finally_code=(params.count()==3) ? ¶ms.as_junction(2, "finally_code must be code") : 0; - Try_catch_result result=try_catch(r, - process_try_body_code, &body_code, - &catch_code); - - if(result.exception_should_be_handled) - throw Exception(PARSER_RUNTIME, - result.exception_should_be_handled, - "catch block must set $exception.handled to some boolean value, not string"); + Try_catch_result result; + + try{ + // process try and catch code + result=try_catch(r, process_try_body_code, &body_code, &catch_code); + } catch(...){ + // process finally code but ignore the result + if(finally_code){ + Temp_skip temp(r); + Value &finally_result=r.process(*finally_code); + } + rethrow; + } + + // process finally code + if(finally_code){ + Temp_skip temp(r); + Value& finally_result=r.process(*finally_code); + + // no exception in try/catch or finally, writing processed body_code or catch_code + r.write(result.processed_code); + + // write out processed finally code + r.write(finally_result); + } else { + // no exception in try/catch, writing processed body_code or catch_code + r.write(result.processed_code); + } - // write out processed body_code or catch_code - r.write_pass_lang(result.processed_code); } static void _throw_operator(Request&, MethodParams& params) { - if(params.count()==1) { + if(params.count()==1 && !params[0].is_string()) { if(HashStringValue *hash=params[0].get_hash()) { const char* type=0; if(Value* value=hash->get(exception_type_part_name)) @@ -814,19 +869,19 @@ static void _throw_operator(Request&, Me } else throw Exception(PARSER_RUNTIME, 0, - "one-param version has hash param"); + "one-param version has hash or string param"); } else { const char* type=params.as_string(0, "type must be string").cstr(); - const String& source=params.as_string(1, "source must be string"); - const char* comment=params.count()>2? params.as_string(2, "comment must be string").cstr() - :0; - throw Exception(type, &source, "%s", comment?comment:""); + const String* source=params.count()>1? ¶ms.as_string(1, "source must be string"):0; + const char* comment=params.count()>2? params.as_string(2, "comment must be string").cstr():0; + throw Exception(type, source, "%s", comment?comment:""); } } static void _sleep_operator(Request& r, MethodParams& params) { double seconds=params.as_double(0, "seconds must be double", r); - pa_sleep((int)trunc(seconds), (int)trunc(seconds*1000)); + if(seconds>0) + pa_sleep((int)trunc(seconds), (int)trunc((seconds-trunc(seconds))*1000000)); } #if defined(WIN32) && defined(_DEBUG) @@ -838,8 +893,7 @@ static void _bpt(Request&, MethodParams& // constructor -VClassMAIN::VClassMAIN(): VClass() { - set_name(*new String(MAIN_CLASS_NAME)); +VClassMAIN::VClassMAIN(): VClass(MAIN_CLASS_NAME) { #ifdef PA_BPT // ^bpt[] @@ -848,36 +902,45 @@ VClassMAIN::VClassMAIN(): VClass() { // ^if(condition){code-when-true} // ^if(condition){code-when-true}{code-when-false} - add_native_method("if", Method::CT_ANY, _if, 2, 3); + // ^if(condition){code-when-true} (another condition){code-when-true} ... {code-when-false} + add_native_method("if", Method::CT_ANY, _if, 2, 10000, Method::CO_WITHOUT_FRAME); + + // ^untaint[as-is|uri|sql|js|html|html-typo|regex|parser-code]{code} + add_native_method("untaint", Method::CT_ANY, _untaint, 1, 2, Method::CO_WITHOUT_FRAME); - // ^untaint[as-is|uri|sql|js|html|html-typo]{code} - add_native_method("untaint", Method::CT_ANY, _untaint, 1, 2); + // ^taint[as-is|uri|sql|js|html|html-typo|regex|parser-code]{code} + add_native_method("taint", Method::CT_ANY, _taint, 1, 2, Method::CO_WITHOUT_FRAME); - // ^taint[as-is|uri|sql|js|html|html-typo]{code} - add_native_method("taint", Method::CT_ANY, _taint, 1, 2); + // ^apply-taint[untaint lang][string] + add_native_method("apply-taint", Method::CT_ANY, _apply_taint, 1, 2, Method::CO_WITHOUT_FRAME); - // ^process[code] + // ^process{code} + // ^process[context]{code}[options hash] add_native_method("process", Method::CT_ANY, _process, 1, 3); // ^rem{code} - add_native_method("rem", Method::CT_ANY, _rem, 1, 10000); + add_native_method("rem", Method::CT_ANY, _rem, 1, 10000, Method::CO_WITHOUT_FRAME); // ^while(condition){code} - add_native_method("while", Method::CT_ANY, _while, 2, 3); + add_native_method("while", Method::CT_ANY, _while, 2, 3, Method::CO_WITHOUT_FRAME); - // ^use[file] - add_native_method("use", Method::CT_ANY, _use, 1, 1); + // ^use[file[;options hash]] + add_native_method("use", Method::CT_ANY, _use, 1, 2); // ^break[] - add_native_method("break", Method::CT_ANY, _break, 0, 0); + // ^break(condition) + add_native_method("break", Method::CT_ANY, _break, 0, 1, Method::CO_WITHOUT_FRAME); + // ^continue[] - add_native_method("continue", Method::CT_ANY, _continue, 0, 0); + // ^continue(condition) + add_native_method("continue", Method::CT_ANY, _continue, 0, 1, Method::CO_WITHOUT_FRAME); + // ^for[i](from-number;to-number-inclusive){code}[delim] add_native_method("for", Method::CT_ANY, _for, 3+1, 3+1+1); // ^eval(expr) // ^eval(expr)[format] - add_native_method("eval", Method::CT_ANY, _eval, 1, 2); + add_native_method("eval", Method::CT_ANY, _eval, 1, 2, Method::CO_WITHOUT_FRAME); // ^connect[protocol://user:pass@host[:port]/database]{code with ^sql-s} add_native_method("connect", Method::CT_ANY, _connect, 2, 2); @@ -891,15 +954,15 @@ VClassMAIN::VClassMAIN(): VClass() { // switch // ^switch[value]{cases} - add_native_method("switch", Method::CT_ANY, _switch, 2, 2); + add_native_method("switch", Method::CT_ANY, _switch, 2, 2, Method::CO_WITHOUT_FRAME); // ^case[value]{code} - add_native_method("case", Method::CT_ANY, _case, 2, 10000); + add_native_method("case", Method::CT_ANY, _case, 2, 10000, Method::CO_WITHOUT_FRAME); // try-catch // ^try{code}{catch code} - add_native_method("try", Method::CT_ANY, _try_operator, 2, 2); + add_native_method("try", Method::CT_ANY, _try_operator, 2, 3, Method::CO_WITHOUT_FRAME); // ^throw[$exception hash] // ^throw[type;source;comment] add_native_method("throw", Method::CT_ANY, _throw_operator, 1, 3);