--- parser3/src/targets/cgi/parser3.C 2002/11/20 13:37:23 1.201 +++ parser3/src/targets/cgi/parser3.C 2019/12/25 22:01:03 1.280 @@ -1,85 +1,93 @@ /** @file Parser: scripting and CGI main. - Copyright(c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com) + Copyright (c) 2001-2017 Art. Lebedev Studio (http://www.artlebedev.com) Author: Alexandr Petrosian (http://paf.design.ru) */ -static const char* IDENT_PARSER3_C="$Date: 2002/11/20 13:37:23 $"; +volatile const char * IDENT_PARSER3_C="$Id: parser3.C,v 1.280 2019/12/25 22:01:03 moko Exp $"; #include "pa_config_includes.h" -#if _MSC_VER -# include -# include -#endif - #include "pa_sapi.h" #include "classes.h" #include "pa_common.h" #include "pa_request.h" -#include "pa_socks.h" #include "pa_version.h" -#include "pool_storage.h" +#include "pa_vconsole.h" -#ifdef WIN32 -# include -# include "getopt.h" -#else -# include +#ifdef _MSC_VER +#include +#include +#include #endif -//#define DEBUG_POOL_MALLOC -//#define DEBUG_STRING_APPENDS_VS_EXPANDS -//#define DEBUG_MAILRECEIVE "mailreceive.eml" - -#ifdef DEBUG_STRING_APPENDS_VS_EXPANDS -extern ulong - string_piece_appends, - wcontext_result_size, - total_alloc_size, - string_string_shortcut_economy; +// defines + +// comment remove me after debugging +//#define PA_DEBUG_CGI_ENTRY_EXIT "c:\\parser\\debug-parser3.log" + +#if defined(_MSC_VER) && !defined(_DEBUG) +# define PA_SUPPRESS_SYSTEM_EXCEPTION #endif // consts #define REDIRECT_PREFIX "REDIRECT_" #define PARSER_CONFIG_ENV_NAME "CGI_PARSER_CONFIG" +#define PARSER_LOG_ENV_NAME "CGI_PARSER_LOG" /// IIS refuses to read bigger chunks -const size_t READ_POST_CHUNK_SIZE=0x400*0x400; // 1M +const size_t READ_POST_CHUNK_SIZE=0x400*0x400; // 1M -static const char *argv0; -static const char *config_filespec_cstr=0; +static const char* argv0; +static const char* config_filespec_cstr=0; static bool fail_on_config_read_problem=true; -static Pool_storage global_pool_storage; ///< global pool storage -static Pool global_pool(&global_pool_storage); ///< global pool +static int args_skip=1; +static char** argv_all = NULL; + static bool cgi; ///< we were started as CGI? static bool mail_received=false; ///< we were started with -m option? [asked to parse incoming message to $mail:received] // for signal handlers Request *request=0; +Request_info *request_info=0; +bool execution_canceled=false; // SAPI -static void log(const char *fmt, va_list args) { +class SAPI_Info { +public: + int http_response_code; +} SAPI_info = { 0 }; + +static void log(const char* fmt, va_list args) { bool opened=false; FILE *f=0; - if(config_filespec_cstr) { + const char* log_by_env=getenv(PARSER_LOG_ENV_NAME); + if(!log_by_env) + log_by_env=getenv(REDIRECT_PREFIX PARSER_LOG_ENV_NAME); + if(log_by_env) { + f=fopen(log_by_env, "at"); + opened=f!=0; + } +#ifdef PA_DEBUG_CGI_ENTRY_EXIT + f=fopen(PA_DEBUG_CGI_ENTRY_EXIT, "at"); + opened=f!=0; +#endif + + if(!opened && config_filespec_cstr) { char beside_config_path[MAX_STRING]; strncpy(beside_config_path, config_filespec_cstr, MAX_STRING-1); beside_config_path[MAX_STRING-1]=0; - if(!( - rsplit(beside_config_path, '/') || - rsplit(beside_config_path, '\\'))) { // strip filename + if(!(rsplit(beside_config_path, '/') || rsplit(beside_config_path, '\\'))) { // strip filename // no path, just filename beside_config_path[0]='.'; beside_config_path[1]=0; } char file_spec[MAX_STRING]; - snprintf(file_spec, MAX_STRING, - "%s/parser3.log", beside_config_path); + snprintf(file_spec, MAX_STRING, "%s/parser3.log", beside_config_path); f=fopen(file_spec, "at"); opened=f!=0; } @@ -87,21 +95,32 @@ static void log(const char *fmt, va_list if(!opened) f=stderr; + // use no memory [so that we could log out-of-memory error] + setbuf(f, 0); // stderr stream is unbuffered by default, but still... + // prefix time_t t=time(0); - if(const char *stamp=ctime(&t)) { // never saw that + if(const char* stamp=ctime(&t)) { // never saw that if(size_t len=strlen(stamp)) // saw once stamp being ="" - fprintf(f, "[%.*s] ", len-1, stamp); + fprintf(f, "[%.*s] [%u] ", (int)len-1, stamp, (unsigned int)getpid() ); } // message - char buf[MAX_STRING]; - size_t size=vsnprintf(buf, MAX_STRING, fmt, args); - remove_crlf(buf, buf+size); - + char buf[MAX_LOG_STRING]; + size_t size=vsnprintf(buf, MAX_LOG_STRING, fmt, args); + size=remove_crlf(buf, buf+size); fwrite(buf, size, 1, f); + + if(request_info) + fprintf(f, " [uri=%s, method=%s, cl=%lu]", + request_info->uri? request_info->uri: "", + request_info->method? request_info->method: "", + request_info->content_length); + else + fputs(" [no request info]", f); + // newline - fprintf(f, "\n"); + fputs("\n", f); if(opened) fclose(f); @@ -109,58 +128,91 @@ static void log(const char *fmt, va_list fflush(f); } -// appends to parser3.log located beside my binary if openable, to stderr otherwize -void SAPI::log(Pool& , const char *fmt, ...) { - va_list args; +#ifdef PA_DEBUG_CGI_ENTRY_EXIT +static void log(const char* fmt, ...) { + va_list args; va_start(args,fmt); - ::log(fmt, args); + log(fmt, args); va_end(args); } - -void SAPI::die(const char *fmt, ...) { -#ifdef DEBUG_POOL_MALLOC - extern void log_pool_stats(Pool& pool); - log_pool_stats(global_pool); #endif - va_list args; +// appends to parser3.log located beside my binary if openable, to stderr otherwize +void SAPI::log(SAPI_Info&, const char* fmt, ...) { + va_list args; va_start(args,fmt); - // log - - // logging is more important than user - // she can cancel download, we'd get SIG_PIPE, - // nothing would be logged then ::log(fmt, args); + va_end(args); +} +static void die_or_abort(const char* fmt, va_list args, bool write_core) { // inform user char body[MAX_STRING]; int content_length=vsnprintf(body, MAX_STRING, fmt, args); - va_end(args); - // prepare header // let's be honest, that's bad we couldn't produce valid output - SAPI::add_header_attribute(global_pool, "status", "500"); - SAPI::add_header_attribute(global_pool, "content-type", "text/plain"); + // capitalized headers passed for preventing malloc during capitalization + SAPI::add_header_attribute(SAPI_info, HTTP_STATUS_CAPITALIZED, "500"); + SAPI::add_header_attribute(SAPI_info, HTTP_CONTENT_TYPE_CAPITALIZED, "text/plain"); + // don't use 'format' function because it calls malloc char content_length_cstr[MAX_NUMBER]; snprintf(content_length_cstr, sizeof(content_length_cstr), "%u", content_length); - SAPI::add_header_attribute(global_pool, "content-length", content_length_cstr); + SAPI::add_header_attribute(SAPI_info, HTTP_CONTENT_LENGTH_CAPITALIZED, content_length_cstr); // send header - SAPI::send_header(global_pool); + SAPI::send_header(SAPI_info); // body - SAPI::send_body(global_pool, body, content_length); + SAPI::send_body(SAPI_info, body, content_length); + + // exit & try to produce core dump[unix] or invoke debugger[Win32 Debug version] + if(write_core) { +#ifdef WIN32 + // IIS with abort failes to show STDOUT, it just barks "abnormal program termination" + exit(1); +#else + abort(); +#endif + } else + exit(1); +} + +void SAPI::die(const char* fmt, ...) { + va_list args; + + // logging first, can't log inside die_or_abort due to vsnprintf (bug #106) + va_start(args,fmt); + ::log(fmt, args); + va_end(args); + + va_start(args, fmt); + die_or_abort(fmt, args, false /*write core?*/); +// va_end(args); +} + +void SAPI::abort(const char* fmt, ...) { + va_list args; + + // logging first, can't log inside die_or_abort due to vsnprintf (bug #106) + va_start(args,fmt); + ::log(fmt, args); + va_end(args); - exit(1); + va_start(args, fmt); + die_or_abort(fmt, args, true /*write core?*/); +// va_end(args); } -const char *SAPI::get_env(Pool& , const char *name) { - return getenv(name); +char* SAPI::Env::get(SAPI_Info& , const char* name) { + if(char *local=getenv(name)) + return pa_strdup(local); + else + return 0; } -const char *const *SAPI::environment(Pool&) { +const char* const *SAPI::Env::get(SAPI_Info&) { #ifdef _MSC_VER extern char **_environ; return _environ; @@ -170,11 +222,10 @@ const char *const *SAPI::environment(Poo #endif } -size_t SAPI::read_post(Pool& , char *buf, size_t max_bytes) { +size_t SAPI::read_post(SAPI_Info& , char *buf, size_t max_bytes) { size_t read_size=0; do { - ssize_t chunk_size=read(fileno(stdin), - buf+read_size, min(READ_POST_CHUNK_SIZE, max_bytes-read_size)); + ssize_t chunk_size=read(fileno(stdin), buf+read_size, min(READ_POST_CHUNK_SIZE, max_bytes-read_size)); if(chunk_size<=0) break; read_size+=chunk_size; @@ -183,38 +234,34 @@ size_t SAPI::read_post(Pool& , char *buf return read_size; } -void SAPI::add_header_attribute(Pool& , const char *key, const char *value) { - if(cgi) - printf("%s: %s\n", key, value); +void SAPI::add_header_attribute(SAPI_Info& , const char* dont_store_key, const char* dont_store_value) { + if(strcasecmp(dont_store_key, HTTP_STATUS)==0) + SAPI_info.http_response_code=atoi(dont_store_value); + if( cgi && (!request || !request->console.was_used()) ) + printf("%s: %s\n", capitalize(dont_store_key), dont_store_value); } -/// @todo intelligent cache-control -void SAPI::send_header(Pool& ) { +void SAPI::send_header(SAPI_Info& ) { if(cgi) { -// puts("expires: Fri, 23 Mar 2001 09:32:23 GMT"); - - // header | body delimiter puts(""); } } -void SAPI::send_body(Pool& , const void *buf, size_t size) { - stdout_write(buf, size); +size_t SAPI::send_body(SAPI_Info& , const void *buf, size_t size) { + return stdout_write(buf, size); } -// - -static void full_file_spec(const char *file_name, char *buf, size_t buf_size) { +static void full_file_spec(const char* file_name, char *buf, size_t buf_size) { if(file_name) if(file_name[0]=='/' #ifdef WIN32 - || (file_name[0] && file_name[1]==':') + || file_name[0] && file_name[1]==':' #endif - ) - strncpy(buf, file_name, buf_size); - else { - char cwd[MAX_STRING]; getcwd(cwd, MAX_STRING); - snprintf(buf, buf_size, "%s/%s", cwd, file_name); + ){ + strncpy(buf, file_name, buf_size-1); buf[buf_size-1]=0; + } else { + char cwd[MAX_STRING]; + snprintf(buf, buf_size, "%s/%s", getcwd(cwd, MAX_STRING) ? cwd : "", file_name); } else buf[0]=0; @@ -223,226 +270,301 @@ static void full_file_spec(const char *f #endif } +static void log_signal(const char* signal_name) { + if(request_info) + SAPI::log(SAPI_info, "%s received while %s. uri=%s, method=%s, cl=%u", + signal_name, + request ? "executing code" : "reading data", + request_info->uri, + request_info->method, + request_info->content_length); + else + SAPI::log(SAPI_info, "%s received before or after processing request", + signal_name); +} + #ifdef SIGUSR1 -void SIGUSR1_Handler(int /*sig*/){ - SAPI::log(global_pool, "SIGUSR1 received. url=", request?request->info.uri:""); +static void SIGUSR1_handler(int /*sig*/){ + log_signal("SIGUSR1"); } #endif #ifdef SIGPIPE -void SIGPIPE_Handler(int /*sig*/){ - SAPI::log(global_pool, "SIGPIPE received. url=", request?request->info.uri:""); +#define SIGPIPE_NAME "SIGPIPE" +static const String sigpipe_name(SIGPIPE_NAME); +static void SIGPIPE_handler(int /*sig*/){ + Value* sigpipe=0; + if(request) + sigpipe=request->main_class.get_element(sigpipe_name); + if(sigpipe && sigpipe->as_bool()) + log_signal(SIGPIPE_NAME); + + execution_canceled=true; if(request) - request->interrupt(); + request->set_skip(Request::SKIP_INTERRUPTED); } #endif +#ifdef WIN32 +const char* maybe_reconstruct_IIS_status_in_qs(const char* original) +{ + // 404;http://servername/page[?param=value...] + // ';' should be urlencoded by HTTP standard, so we shouldn't get it from browser + // and can consider that as an indication that this is IIS way to report errors + + if(original && isdigit((unsigned char)original[0]) && isdigit((unsigned char)original[1]) && isdigit((unsigned char)original[2]) && original[3]==';'){ + size_t original_len=strlen(original); + char* reconstructed=new(PointerFreeGC) char[original_len +12/*IIS-STATUS=&*/ +14/*IIS-DOCUMENT=&*/ +1]; + char* cur=reconstructed; + memcpy(cur, "IIS-STATUS=", 11); cur+=11; + memcpy(cur, original, 3); cur+=3; + *cur++='&'; + + const char* qmark_at=strchr(original, '?'); + memcpy(cur, "IIS-DOCUMENT=", 13); cur+=13; + { + size_t value_len=(qmark_at ? qmark_at-original : original_len)-4; + memcpy(cur, original+4, value_len); cur+=value_len; + } + + if(qmark_at) { + *cur++='&'; + strcpy(cur, qmark_at+1/*skip ? itself*/); + } else + *cur=0; + + return reconstructed; + } + + return original; +} +#endif + + +class RequestController { +public: + RequestController(Request* r){ + ::request=r; + } + ~RequestController(){ + ::request=0; + } +}; + + /** main workhorse - @todo - IIS: remove trailing default-document[index.html] from $request.uri. - to do that we need to consult metabase, - wich is tested but seems slow. - IIS5 todo find out proper 'illegal call' check + @todo + IIS: remove trailing default-document[index.html] from $request.uri. + to do that we need to consult metabase, + wich is tested but seems slow. */ -static void real_parser_handler( - const char *filespec_to_process, - const char *request_method, bool header_only) { - // init socks - init_socks(global_pool); - - // init global classes - init_methoded_array(global_pool); - // init global variables - pa_globals_init(global_pool); - - // request pool, must be different ptr from global [used in VStateless_class.add_method] - Pool request_pool(&global_pool_storage); +static void real_parser_handler(const char* filespec_to_process, const char* request_method, bool header_only) { + // init libraries + pa_globals_init(); + if(!filespec_to_process || !*filespec_to_process) - SAPI::die("Parser/%s", PARSER_VERSION); + SAPI::die("Parser/%s" +#ifdef PA_DEBUG_CGI_ENTRY_EXIT + " with entry/exit tracing" +#endif + , PARSER_VERSION); // Request info - Request::Info request_info; + Request_info request_info; memset(&request_info, 0, sizeof(request_info)); char document_root_buf[MAX_STRING]; if(cgi) { - if(const char *env_document_root=SAPI::get_env(request_pool, "DOCUMENT_ROOT")) + if(const char* env_document_root=getenv("DOCUMENT_ROOT")) request_info.document_root=env_document_root; - else if(const char *path_info=SAPI::get_env(request_pool, "PATH_INFO")) { + else if(const char* path_info=getenv("PATH_INFO")) { // IIS size_t len=min(sizeof(document_root_buf)-1, strlen(filespec_to_process)-strlen(path_info)); memcpy(document_root_buf, filespec_to_process, len); document_root_buf[len]=0; request_info.document_root=document_root_buf; } else - throw Exception("parser.runtime", - 0, - "CGI: no PATH_INFO defined(in reinventing DOCUMENT_ROOT)"); + throw Exception(PARSER_RUNTIME, 0, "CGI: no PATH_INFO defined(in reinventing DOCUMENT_ROOT)"); } else { full_file_spec("", document_root_buf, sizeof(document_root_buf)); request_info.document_root=document_root_buf; } request_info.path_translated=filespec_to_process; request_info.method=request_method ? request_method : "GET"; - const char *query_string=SAPI::get_env(request_pool, "QUERY_STRING"); + const char* query_string= +#ifdef WIN32 + maybe_reconstruct_IIS_status_in_qs +#endif + (getenv("QUERY_STRING")); request_info.query_string=query_string; if(cgi) { - if(const char *env_request_uri=SAPI::get_env(request_pool, "REQUEST_URI")) + // few absolute obligatory + const char* path_info=getenv("PATH_INFO"); + if(!path_info) + SAPI::die("CGI: illegal call (missing PATH_INFO)"); + const char* script_name=getenv("SCRIPT_NAME"); + if(!script_name) + SAPI::die("CGI: illegal call (missing SCRIPT_NAME)"); + + const char* env_request_uri=request_info.strip_absolute_uri(getenv("REQUEST_URI")); + if(env_request_uri) request_info.uri=env_request_uri; - else if(const char *path_info=SAPI::get_env(request_pool, "PATH_INFO")) + else if(query_string) { - char *reconstructed_uri=(char *)request_pool.malloc( - strlen(path_info)+1/*'?'*/+ - strlen(query_string)+1/*0*/); + char* reconstructed_uri=new(PointerFreeGC) char[strlen(path_info) + 1/*'?'*/+ strlen(query_string) + 1/*0*/]; strcpy(reconstructed_uri, path_info); strcat(reconstructed_uri, "?"); strcat(reconstructed_uri, query_string); request_info.uri=reconstructed_uri; } else request_info.uri=path_info; - else - throw Exception("parser.runtime", - 0, - "CGI: no PATH_INFO defined(in reinventing REQUEST_URI)"); - - // they've changed this under IIS5. - if(const char *script_name=SAPI::get_env(request_pool, "SCRIPT_NAME")) { - size_t script_name_len=strlen(script_name); - size_t uri_len=strlen(request_info.uri); - if(strncmp(request_info.uri,script_name, script_name_len)==0 && - script_name_len != uri_len) // under IIS they are the same - SAPI::die("CGI: illegal call"); - } + + if(env_request_uri) { // apache & others stuck to standards + /* + http://parser3/env.html?123 =OK + $request:uri=/env.html?123 + REQUEST_URI='/env.html?123' + SCRIPT_NAME='/cgi-bin/parser3' + PATH_INFO='/env.html' + + http://parser3/cgi-bin/parser3/env.html?123 =ERROR + $request:uri=/cgi-bin/parser3/env.html?123 + REQUEST_URI='/cgi-bin/parser3/env.html?123' + SCRIPT_NAME='/cgi-bin/parser3' + PATH_INFO='/env.html' + */ + size_t script_name_len=strlen(script_name); + size_t uri_len=strlen(env_request_uri); + if(strncmp(env_request_uri, script_name, script_name_len)==0 && script_name_len != uri_len) // under IIS they are the same + SAPI::die("CGI: illegal call (1)"); + } else { // seen on IIS5 + /* + http://nestle/env.html?123 =OK + $request:uri=/env.html?123 + REQUEST_URI='' + SCRIPT_NAME='/env.html' + PATH_INFO='/env.html' + + http://nestle/cgi-bin/parser3.exe/env.html =ERROR + $request:uri=/env.html + REQUEST_URI='' + SCRIPT_NAME='/cgi-bin/parser3.exe' + PATH_INFO='/env.html' + */ + if(strcmp(script_name, path_info)!=0) + SAPI::die("CGI: illegal call (2)"); + } } else request_info.uri=""; - request_info.content_type=SAPI::get_env(request_pool, "CONTENT_TYPE"); - const char *content_length=SAPI::get_env(request_pool, "CONTENT_LENGTH"); + request_info.content_type=getenv("CONTENT_TYPE"); + const char* content_length=getenv("CONTENT_LENGTH"); request_info.content_length=(content_length?atoi(content_length):0); - request_info.cookie=SAPI::get_env(request_pool, "HTTP_COOKIE"); + request_info.cookie=getenv("HTTP_COOKIE"); request_info.mail_received=mail_received; + request_info.argv=argv_all; + request_info.args_skip=args_skip; - // prepare to process request - Request request(request_pool, - request_info, -/*#ifdef _DEBUG - String::UL_HTML|String::UL_OPTIMIZE_BIT -#else*/ - cgi ? String::UL_HTML|String::UL_OPTIMIZE_BIT : String::UL_AS_IS -/*#endif*/ - , - true /* status_allowed */); - - // get request ptr for signal handlers - ::request=&request; -#ifdef SIGUSR1 - if(signal(SIGUSR1, SIGUSR1_Handler)==SIG_ERR) - SAPI::die("Can not set handler for SIGUSR1"); -#endif -#ifdef SIGPIPE - if(signal(SIGPIPE, SIGPIPE_Handler)==SIG_ERR) - SAPI::die("Can not set handler for SIGPIPE"); + // get request_info ptr for signal handlers + ::request_info=&request_info; + if(execution_canceled) + SAPI::die("Execution canceled"); + +#ifdef PA_DEBUG_CGI_ENTRY_EXIT + log("request_info: method=%s, uri=%s, q=%s, dr=%s, pt=%s, cookies=%s, cl=%u", + request_info.method, + request_info.uri, + request_info.query_string, + request_info.document_root, + request_info.path_translated, + request_info.cookie, + request_info.content_length); #endif - char config_filespec_buf[MAX_STRING]; - if(!config_filespec_cstr) { - const char *config_by_env=getenv(PARSER_CONFIG_ENV_NAME); - if(!config_by_env) - config_by_env=getenv(REDIRECT_PREFIX PARSER_CONFIG_ENV_NAME); - if(config_by_env) - config_filespec_cstr=config_by_env; - else { - // beside by binary - char beside_binary_path[MAX_STRING]; - strncpy(beside_binary_path, argv0, MAX_STRING-1); beside_binary_path[MAX_STRING-1]=0; // filespec of my binary - if(!( - rsplit(beside_binary_path, '/') || - rsplit(beside_binary_path, '\\'))) { // strip filename - // no path, just filename - // @todo full path, not ./! - beside_binary_path[0]='.'; beside_binary_path[1]=0; + // prepare to process request + Request request(SAPI_info, request_info, cgi ? String::Language(String::L_HTML|String::L_OPTIMIZE_BIT) : String::L_AS_IS); + + { + // get ::request ptr for signal handlers + RequestController rc(&request); + + char config_filespec_buf[MAX_STRING]; + if(!config_filespec_cstr) { + const char* config_by_env=getenv(PARSER_CONFIG_ENV_NAME); + if(!config_by_env) + config_by_env=getenv(REDIRECT_PREFIX PARSER_CONFIG_ENV_NAME); + if(config_by_env) + config_filespec_cstr=config_by_env; + else { + // beside by binary + char beside_binary_path[MAX_STRING]; + strncpy(beside_binary_path, argv0, MAX_STRING-1); beside_binary_path[MAX_STRING-1]=0; // filespec of my binary + if(!(rsplit(beside_binary_path, '/') || rsplit(beside_binary_path, '\\'))) { // strip filename + // no path, just filename + // @todo full path, not ./! + beside_binary_path[0]='.'; beside_binary_path[1]=0; + } + snprintf(config_filespec_buf, MAX_STRING, "%s/%s", beside_binary_path, AUTO_FILE_NAME); + config_filespec_cstr=config_filespec_buf; + fail_on_config_read_problem=entry_exists(config_filespec_cstr); } - snprintf(config_filespec_buf, MAX_STRING, - "%s/%s", - beside_binary_path, AUTO_FILE_NAME); - config_filespec_cstr=config_filespec_buf; - fail_on_config_read_problem=entry_exists(config_filespec_cstr); } + + // process the request + request.core(config_filespec_cstr, fail_on_config_read_problem, header_only); + + // ::request cleared in RequestController desctructor to prevent signal handlers from accessing invalid memory } - - // process the request - request.core( - config_filespec_cstr, fail_on_config_read_problem, - header_only); - // no request [prevent signal handlers from accessing invalid memory] - ::request=0; - - // - done_socks(); - -#ifdef DEBUG_POOL_MALLOC - extern void log_pool_stats(Pool& pool); - log_pool_stats(request_pool); -#endif + // finalize libraries + pa_globals_done(); +} -#ifdef DEBUG_STRING_APPENDS_VS_EXPANDS - SAPI::log(global_pool, - "string piece appends=%lu, wcontext_result_size=%lu, string_string_shortcut_economy_closer=%lu, total_alloc_size=%lu", - string_piece_appends, - wcontext_result_size, - string_string_shortcut_economy, - total_alloc_size); -#endif +#ifdef PA_SUPPRESS_SYSTEM_EXCEPTION +static const Exception call_real_parser_handler__do_PEH_return_it(const char* filespec_to_process, const char* request_method, bool header_only){ + try { + real_parser_handler(filespec_to_process, request_method, header_only); + } catch(const Exception& e) { + return e; + } + return Exception(); } -static void call_real_parser_handler__do_SEH( - const char *filespec_to_process, - const char *request_method, bool header_only) { -#if _MSC_VER && !defined(_DEBUG) +static void call_real_parser_handler__supress_system_exception(const char* filespec_to_process, const char* request_method, bool header_only){ + Exception parser_exception; LPEXCEPTION_POINTERS system_exception=0; + __try { -#endif - real_parser_handler( - filespec_to_process, - request_method, header_only); - -#if _MSC_VER && !defined(_DEBUG) + parser_exception=call_real_parser_handler__do_PEH_return_it(filespec_to_process, request_method, header_only); } __except ( (system_exception=GetExceptionInformation()), - EXCEPTION_EXECUTE_HANDLER) { - + EXCEPTION_EXECUTE_HANDLER) + { + if(system_exception) if(_EXCEPTION_RECORD *er=system_exception->ExceptionRecord) - throw Exception(0, - 0, - "Exception 0x%08X at 0x%08X", er->ExceptionCode, er->ExceptionAddress); - else - throw Exception(0, 0, "Exception "); + throw Exception("system", 0, "0x%08X at 0x%08X", er->ExceptionCode, er->ExceptionAddress); else - throw Exception(0, 0, "Exception "); + throw Exception("system", 0, ""); + else + throw Exception("system", 0, ""); } -#endif -} -#if _MSC_VER -int failed_new(size_t size) { - SAPI::die("out of memory in 'new', failed to allocated %u bytes", size); - return 0; // not reached + if(parser_exception) + throw Exception(parser_exception); } -#endif -#ifdef HAVE_SET_NEW_HANDLER -static void failed_new() { - SAPI::die("out of memory in 'new'"); -} +#define REAL_PARSER_HANDLER call_real_parser_handler__supress_system_exception +#else +#define REAL_PARSER_HANDLER real_parser_handler #endif -static void usage(const char *program) { +static void usage(const char* program) { printf( - "Parser/%s Copyright(c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com)\n" + "Parser/%s\n" + "Copyright (c) 2001-2017 Art. Lebedev Studio (http://www.artlebedev.com)\n" "Author: Alexandr Petrosian (http://paf.design.ru)\n" "\n" "Usage: %s [options] file\n" @@ -451,82 +573,95 @@ static void usage(const char *program) { " -m Parse mail, put received letter to $mail:received\n" #endif " -f config_file Use this config file (/path/to/auto.p)\n" - " -h Display usage information (this message)\n" - , PARSER_VERSION, + " -h Display usage information (this message)\n", + PARSER_VERSION, program); exit(EINVAL); } int main(int argc, char *argv[]) { -#ifdef DEBUG_MAILRECEIVE - if(FILE *fake_in=fopen(DEBUG_MAILRECEIVE, "rt")) { - dup2(fake_in->_file, 0/*STDIN_FILENO*/); - } +#ifdef PA_DEBUG_CGI_ENTRY_EXIT + log("main: entry"); #endif -#ifdef _DEBUG -// _crtBreakAlloc=33112; +#ifndef PA_DEBUG_DISABLE_GC + GC_java_finalization=0; + // Dont collect unless explicitly requested + // this is quicker (~30% ), but less memory-efficient(~8%) + // so deciding for speed + GC_dont_gc=1; +#endif + +#ifdef SIGUSR1 + if(signal(SIGUSR1, SIGUSR1_handler)==SIG_ERR) + SAPI::die("Can not set handler for SIGUSR1"); #endif -// _asm int 3; +#ifdef SIGPIPE + if(signal(SIGPIPE, SIGPIPE_handler)==SIG_ERR) + SAPI::die("Can not set handler for SIGPIPE"); +#endif + + argv_all=argv; argv0=argv[0]; umask(2); // were we started as CGI? - cgi= - getenv("SERVER_SOFTWARE") || - getenv("SERVER_NAME") || - getenv("GATEWAY_INTERFACE") || - getenv("REQUEST_METHOD"); - + cgi=(getenv("SERVER_SOFTWARE") || getenv("SERVER_NAME") || getenv("GATEWAY_INTERFACE") || getenv("REQUEST_METHOD")) && !getenv("PARSER_VERSION"); + char *raw_filespec_to_process; - if(cgi) + if(cgi) { raw_filespec_to_process=getenv("PATH_TRANSLATED"); - else { - optind = 1; - opterr = 0; - int c; - while((c = getopt(argc, argv, "hf:" -#ifdef WITH_MAILRECEIVE - "m" -#endif - )) > 0) { - switch (c) { - case 'h': - usage(argv[0]); - break; - case 'f': - config_filespec_cstr=optarg; + if(raw_filespec_to_process && !*raw_filespec_to_process) + raw_filespec_to_process=0; + } else { + int optind=1; + while(optind < argc){ + char *carg = argv[optind]; + if(carg[0] != '-') break; + + for(size_t k = 1; k < strlen(carg); k++){ + char c = carg[k]; + switch (c) { + case 'h': + usage(argv[0]); + break; + case 'f': + if(optind < argc - 1){ + optind++; + config_filespec_cstr=argv[optind]; + } + break; #ifdef WITH_MAILRECEIVE - case 'm': - mail_received=true; - break; -#endif - default: - fprintf(stderr, "%s: invalid option '%c'\n", argv[0], optopt); - usage(argv[0]); - break; + case 'm': + mail_received=true; + break; +#endif + default: + fprintf(stderr, "%s: invalid option '%c'\n", argv[0], c); + usage(argv[0]); + break; + } } + optind++; } - if (optind != argc - 1) { + + if (optind > argc - 1) { fprintf(stderr, "%s: file not specified\n", argv[0]); usage(argv[0]); } - - raw_filespec_to_process=argv[optind++]; + raw_filespec_to_process=argv[optind]; + args_skip=optind; } -#ifdef WIN32 +#ifdef _MSC_VER setmode(fileno(stdin), _O_BINARY); setmode(fileno(stdout), _O_BINARY); setmode(fileno(stderr), _O_BINARY); #endif -#if _MSC_VER - _set_new_handler(failed_new); - -#ifdef _DEBUG +#if defined(_MSC_VER) && defined(_DEBUG) // Get current flag int tmpFlag = _CrtSetDbgFlag( _CRTDBG_REPORT_FLAG ); @@ -535,44 +670,51 @@ int main(int argc, char *argv[]) { // Set flag to the new value _CrtSetDbgFlag( tmpFlag ); -// _CrtSetBreakAlloc(471); - -#endif -#endif - -#ifdef HAVE_SET_NEW_HANDLER - std::set_new_handler(failed_new); + _CrtSetReportMode( _CRT_WARN, _CRTDBG_MODE_FILE ); + _CrtSetReportFile( _CRT_WARN, _CRTDBG_FILE_STDERR ); #endif char filespec_to_process[MAX_STRING]; full_file_spec(raw_filespec_to_process, filespec_to_process, sizeof(filespec_to_process)); - const char *request_method=getenv("REQUEST_METHOD"); + const char* request_method=getenv("REQUEST_METHOD"); bool header_only=request_method && strcasecmp(request_method, "HEAD")==0; try { // global try - call_real_parser_handler__do_SEH( - filespec_to_process, - request_method, header_only); + REAL_PARSER_HANDLER(filespec_to_process, request_method, header_only); } catch(const Exception& e) { // global problem // don't allocate anything on pool here: // possible pool' exception not catch-ed now // and there could be out-of-memory exception + char buf[MAX_STRING]; + snprintf(buf, MAX_STRING, "Unhandled exception %s", e.comment()); + // log it + SAPI::log(SAPI_info, "%s", buf); + + // + int content_length=strlen(buf); + + // prepare header + // capitalized headers are used for preventing malloc during capitalization + SAPI::add_header_attribute(SAPI_info, HTTP_CONTENT_TYPE_CAPITALIZED, "text/plain"); + // don't use 'format' function because it calls malloc + char content_length_cstr[MAX_NUMBER]; + snprintf(content_length_cstr, MAX_NUMBER, "%u", content_length); + SAPI::add_header_attribute(SAPI_info, HTTP_CONTENT_LENGTH_CAPITALIZED, content_length_cstr); + + // send header + SAPI::send_header(SAPI_info); + + // send body + if(!header_only) + SAPI::send_body(SAPI_info, buf, content_length); - SAPI::die("exception in request exception handler: %s", e.comment()); -#ifndef _DEBUG - } catch(...) { - SAPI::die(""); -#endif + // unsuccessful finish } - -#ifndef WIN32 - // - if(!cgi) - SAPI::send_body(global_pool, "\n", 1); +#ifdef PA_DEBUG_CGI_ENTRY_EXIT + log("main: successful return"); #endif -//_asm int 3; - return 0; + return SAPI_info.http_response_code < 100 ? SAPI_info.http_response_code : 0; }