--- parser3/src/classes/op.C 2001/09/05 09:02:52 1.40 +++ parser3/src/classes/op.C 2002/02/08 08:30:10 1.71 @@ -1,14 +1,13 @@ /** @file Parser: parser @b operators. - Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) + Copyright (c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com) + Author: Alexandr Petrosian (http://paf.design.ru) - Author: Alexander Petrosyan (http://design.ru/paf) + $Id: op.C,v 1.71 2002/02/08 08:30:10 paf Exp $ */ -static const char *RCSId="$Id: op.C,v 1.40 2001/09/05 09:02:52 parser Exp $"; #include "classes.h" -#include "pa_config_includes.h" #include "pa_common.h" #include "pa_request.h" #include "pa_vint.h" @@ -39,30 +38,34 @@ private: // methods static void _if(Request& r, const String&, MethodParams *params) { - Value& condition_code=params->get(0); + Value& condition_code=params->as_junction(0, "condition must be expression"); bool condition=r.process(condition_code, 0/*no name*/, false/*don't intercept string*/).as_bool(); if(condition) r.write_pass_lang(r.process(params->as_junction(1, "'then' parameter must be code"))); - else if(params->size()==3) + else if(params->size()>2) r.write_pass_lang(r.process(params->as_junction(2, "'else' parameter must be code"))); } static void _untaint(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); - const String& lang_name=r.process(params->get(0)).as_string(); - String::Untaint_lang lang=static_cast( - untaint_lang_name2enum->get_int(lang_name)); - if(!lang) - PTHROW(0, 0, - &lang_name, - "invalid untaint language"); + uchar lang; + if(params->size()==1) + lang=String::UL_AS_IS; // mark as simply 'tainted'. 
useful in html from sql + else { + const String& lang_name=params->as_string(0, "lang must be string"); + lang=untaint_lang_name2enum->get_int(lang_name); + if(!lang) + throw Exception(0, 0, + &lang_name, + "invalid taint language"); + } { - Value& vbody=params->as_junction(1, "body must be code"); + Value& vbody=params->as_junction(params->size()-1, "body must be code"); Temp_lang temp_lang(r, lang); // set temporarily specified ^untaint[language; r.write_pass_lang(r.process(vbody)); // process marking tainted with that lang @@ -72,16 +75,14 @@ static void _untaint(Request& r, const S static void _taint(Request& r, const String&, MethodParams *params) { Pool& pool=r.pool(); - String::Untaint_lang lang; + uchar lang; if(params->size()==1) lang=String::UL_TAINTED; // mark as simply 'tainted'. useful in table:set else { - const String& lang_name= - r.process(params->get(0)).as_string(); - lang=static_cast( - untaint_lang_name2enum->get_int(lang_name)); + const String& lang_name=params->as_string(0, "lang must be string"); + lang=untaint_lang_name2enum->get_int(lang_name); if(!lang) - PTHROW(0, 0, + throw Exception(0, 0, &lang_name, "invalid taint language"); } @@ -119,11 +120,14 @@ static void _process(Request& r, const S // evaluate source to process const String& source= - r.process(params->get(0)).as_string(); + r.process(params->as_junction(0, "body must be code")).as_string(); // process source code, append processed methods to 'self' class // maybe-define new @main - r.use_buf(source.cstr(), place, &self_class); + r.use_buf( + source.cstr(String::UL_UNSPECIFIED, r.connection(0)), + place, + &self_class); // maybe-execute @main[] if(const Method *method=self_class.get_method(*main_method_name)) { @@ -147,7 +151,7 @@ static void _while(Request& r, const Str int endless_loop_count=0; while(true) { if(++endless_loop_count>=MAX_LOOPS) // endless loop? 
- PTHROW(0, 0, + throw Exception(0, 0, &method_name, "endless loop detected"); @@ -171,28 +175,28 @@ static void _use(Request& r, const Strin static void _for(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); - const String& var_name=r.process(params->get(0)).as_string(); - int from=r.process(params->get(1)).as_int(); - int to=r.process(params->get(2)).as_int(); + const String& var_name=params->as_string(0, "var name must be string"); + int from=params->as_int(1, "from must be int", r); + int to=params->as_int(2, "to must be int", r); Value& body_code=params->as_junction(3, "body must be code"); - Value *delim_code=params->size()==3+1+1?&params->get(3+1):0; + Value *delim_maybe_code=params->size()>4?&params->get(4):0; + + if(to-from>=MAX_LOOPS) // too long loop? + throw Exception(0, 0, + &method_name, + "endless loop detected"); bool need_delim=false; VInt *vint=new(pool) VInt(pool, 0); - int endless_loop_count=0; for(int i=from; i<=to; i++) { - if(++endless_loop_count>=MAX_LOOPS) // endless loop? - PTHROW(0, 0, - &method_name, - "endless loop detected"); vint->set_int(i); r.root->put_element(var_name, vint); Value& processed_body=r.process(body_code); - if(delim_code) { // delimiter set? + if(delim_maybe_code) { // delimiter set? const String *string=processed_body.get_string(); if(need_delim && string && string->size()) // need delim & iteration produced string? 
- r.write_pass_lang(r.process(*delim_code)); + r.write_pass_lang(r.process(*delim_maybe_code)); need_delim=true; } r.write_pass_lang(processed_body); @@ -205,7 +209,7 @@ static void _eval(Request& r, const Stri Value *result=r.process(expr, 0/*no name YET*/, true/*don't intercept string*/).as_expr_result(); - if(params->size()==2) { + if(params->size()>1) { Value& fmt=params->as_no_junction(1, "fmt must not be code"); Pool& pool=r.pool(); @@ -217,62 +221,64 @@ static void _eval(Request& r, const Stri r.write_no_lang(*result); } - -static void _connect(Request& r, const String&, MethodParams *params) { +static void _error(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); + const String& serror=params->as_string(0, "message must be string"); + throw Exception(0, 0, + &method_name, + "%s", serror.cstr()); +} + + +/// @todo rewrite ugly code with try/try to autoobject TempConnection +static void _connect(Request& r, const String& method_name, MethodParams *params) { + Pool& pool=r.pool(); +#ifdef RESOURCES_DEBUG +struct timeval mt[2]; +#endif Value& url=params->as_no_junction(0, "url must not be code"); Value& body_code=params->as_junction(1, "body must be code"); Table *protocol2driver_and_client= static_cast(r.classes_conf.get(r.OP.name())); +#ifdef RESOURCES_DEBUG +//measure:before +gettimeofday(&mt[0],NULL); +#endif // connect - SQL_Connection& connection=SQL_driver_manager->get_connection( - url.as_string(), protocol2driver_and_client); + SQL_Connection_ptr connection=SQL_driver_manager->get_connection( + url.as_string(), method_name, protocol2driver_and_client); - Exception rethrow_me; - // remember/set current connection - SQL_Connection *saved_connection=r.connection; - r.connection=&connection; +#ifdef RESOURCES_DEBUG +//measure:after connect +gettimeofday(&mt[1],NULL); + +double t[2]; +for(int i=0;i<2;i++) + t[i]=mt[i].tv_sec+mt[i].tv_usec/1000000.0; + +r.sql_connect_time+=t[1]-t[0]; +#endif + Temp_connection 
temp_connection(r, connection.get()); // execute body - bool body_failed=false; - PTRY + try { r.write_assign_lang(r.process(body_code)); - PCATCH(e) { // connect/process problem - rethrow_me=e; body_failed=true; + + } catch(...) { // process/commit problem + connection->mark_to_rollback(); + /*re*/throw; } - PEND_CATCH - - bool finalizer_failed=false; - PTRY - // FINALLY - if(body_failed) - connection.rollback(); - else - connection.commit(); - PCATCH(e) { // commit/rollback problem - rethrow_me=e; finalizer_failed=true; - } - PEND_CATCH - - // close connection [cache it] - connection.close(); - // recall current connection from remembered - r.connection=saved_connection; - - if(body_failed || finalizer_failed) // were there an exception for us to rethrow? - PTHROW(rethrow_me.type(), rethrow_me.code(), - rethrow_me.problem_source(), - rethrow_me.comment()); } +#ifndef DOXYGEN struct Switch_data { Value *searching; Value *found; Value *_default; }; - +#endif static void _switch(Request& r, const String&, MethodParams *params) { void *backup=r.classes_conf.get(*switch_data_name); Switch_data data={&r.process(params->get(0))}; @@ -291,7 +297,7 @@ static void _case(Request& r, const Stri Switch_data *data=static_cast(r.classes_conf.get(*switch_data_name)); if(!data) - PTHROW(0, 0, + throw Exception(0, 0, &method_name, "without switch"); @@ -318,6 +324,171 @@ static void _case(Request& r, const Stri } } +// cache-- + +// consts + +const int DATA_STRING_SERIALIZED_VERSION=0x0001; + +// helper types + +#ifndef DOXYGEN +struct Data_string_serialized_prolog { + int version; +}; +#endif + +void cache_delete(const String& file_spec) { + file_delete(file_spec, false/*fail_on_read_problem*/); +} + +#ifndef DOXYGEN +struct Locked_process_and_cache_put_action_info { + Request *r; + Value *body; +}; +#endif +static void locked_process_and_cache_put_action(int f, void *context) { + Locked_process_and_cache_put_action_info& info= + *static_cast(context); + + // body->process + 
info.body=&info.r->process(*info.body); + + // result->string + const String& data_string=info.body->as_string(); + + // string -serialize> buffer + void *data; size_t data_size; + data_string.serialize( + sizeof(Data_string_serialized_prolog), + data, data_size); + Data_string_serialized_prolog& prolog= + *static_cast(data); + prolog.version=DATA_STRING_SERIALIZED_VERSION; + + // buffer -write> file + write(f, data, data_size); +} +Value *locked_process_and_cache_put(Request& r, + Value& body_code, + const String& file_spec) { + Locked_process_and_cache_put_action_info info={ + &r, + &body_code, + }; + + return file_write_action_under_lock( + file_spec, + "cache_put", locked_process_and_cache_put_action, &info, + false/*as_text*/, + false/*do_append*/, + false/*block*/) ? info.body : 0; +} +String *cache_get(Pool& pool, const String& file_spec) { + void* data; size_t data_size; + if(!file_read(pool, file_spec, + data, data_size, + false/*as_text*/, + false/*fail_on_read_problem*/) + || !data_size/* ignore reads which are empty due to + non-unary open+lockEX conflict with lockSH */) + return 0; + + Data_string_serialized_prolog& prolog= + *static_cast(data); + + if(data_sizeas_string(0, "filespec must be string")); + if(params->size()==1) { // delete + cache_delete(file_spec); + return; + } + + time_t lifespan=(time_t)params->as_double(1, "lifespan must be number", r); + Value& body_code=params->as_junction(2, "body must be code"); + + if(lifespan) { // 'lifespan' specified? try cached copy... + size_t size; + time_t atime, mtime, ctime; + + // hence we don't hope to have unary create/lockEX + // we need some plan to live in a life like that, so... + // worst races plan: + // A B + // open + // |open + // lockSH + // |nonblocking-lockEX fails + // unlockSH + // close, cache_get returns 0 + // open + // nonblocking-lockEX succeeds; process, write, close + // |retry1: open + // ... + // |lockSH succeeds; ... 
+ + // {file_spec} modification time + for(int retry=0; retry<2; retry++) { + if(file_stat(file_spec, size, atime, mtime, ctime, false/*no exception on error*/)) // exists? + if(time(0)-mtime > lifespan) // expired + cache_delete(file_spec); + else // not expired + if(String *cached_body=cache_get(pool, file_spec)) { // have cached copy? + // write it out + r.write_assign_lang(*cached_body); + // happy with it + return; + } + + // non-blocked lock; process; cache it + if(Value *processed_body=locked_process_and_cache_put(r, body_code, file_spec)) { + // write it out + r.write_assign_lang(*processed_body); + // happy with it + return; + } else { // somebody writing result right now + pa_sleep(0, 500000); // waiting half a second + retry=0; // prolonging our wait, than could cache_get it, without processing body_code + } + } + throw Exception(0, 0, + &file_spec, + "locking problem"); + } else { + // 'lifespan'=0, forget cached copy + cache_delete(file_spec); + // process + Value& processed_body=r.process(body_code); + // write it out + r.write_assign_lang(processed_body); + // happy with it + return; + } + // never reached +} + // constructor MOP::MOP(Pool& apool) : Methoded(apool), @@ -331,7 +502,7 @@ MOP::MOP(Pool& apool) : Methoded(apool), add_native_method("if", Method::CT_ANY, _if, 2, 3); // ^untaint[as-is|uri|sql|js|html|html-typo]{code} - add_native_method("untaint", Method::CT_ANY, _untaint, 2, 2); + add_native_method("untaint", Method::CT_ANY, _untaint, 1, 2); // ^taint[as-is|uri|sql|js|html|html-typo]{code} add_native_method("taint", Method::CT_ANY, _taint, 1, 2); @@ -340,7 +511,7 @@ MOP::MOP(Pool& apool) : Methoded(apool), add_native_method("process", Method::CT_ANY, _process, 1, 1); // ^rem{code} - add_native_method("rem", Method::CT_ANY, _rem, 1, 1000); + add_native_method("rem", Method::CT_ANY, _rem, 1, 10000); // ^while(condition){code} add_native_method("while", Method::CT_ANY, _while, 2, 2); @@ -348,24 +519,32 @@ MOP::MOP(Pool& apool) : 
Methoded(apool), // ^use[file] add_native_method("use", Method::CT_ANY, _use, 1, 1); - // ^for[i;from-number;to-number-inclusive]{code}[delim] + // ^for[i](from-number;to-number-inclusive){code}[delim] add_native_method("for", Method::CT_ANY, _for, 3+1, 3+1+1); // ^eval(expr) // ^eval(expr)[format] add_native_method("eval", Method::CT_ANY, _eval, 1, 2); + // ^error[msg] + add_native_method("error", Method::CT_ANY, _error, 1, 1); + // ^connect[protocol://user:pass@host[:port]/database]{code with ^sql-s} add_native_method("connect", Method::CT_ANY, _connect, 2, 2); + + // ^cache[file_spec] delete cache + // ^cache[file_spec](time){code} time=0 no cache + add_native_method("cache", Method::CT_ANY, _cache, 1, 3); + // switch // ^switch[value]{cases} add_native_method("switch", Method::CT_ANY, _switch, 2, 2); // ^case[value]{code} - add_native_method("case", Method::CT_ANY, _case, 2, 1000); + add_native_method("case", Method::CT_ANY, _case, 2, 10000); } // constructor & configurator @@ -374,7 +553,6 @@ Methoded *MOP_create(Pool& pool) { return new(pool) MOP(pool); } - void MOP::configure_user(Request& r) { Pool& pool=r.pool();