--- parser3/src/targets/cgi/parser3.C 2001/03/13 18:32:48 1.3 +++ parser3/src/targets/cgi/parser3.C 2002/11/20 13:37:23 1.201 @@ -1,91 +1,578 @@ -/* - Parser - Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) - Author: Alexander Petrosyan (http://design.ru/paf) +/** @file + Parser: scripting and CGI main. - $Id: parser3.C,v 1.3 2001/03/13 18:32:48 paf Exp $ + Copyright(c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com) + Author: Alexandr Petrosian (http://paf.design.ru) */ -#include "pa_config.h" +static const char* IDENT_PARSER3_C="$Date: 2002/11/20 13:37:23 $"; -#ifdef WIN32 -# include -# include +#include "pa_config_includes.h" + +#if _MSC_VER +# include +# include #endif -#include -#include "core.h" -#include "pa_request.h" +#include "pa_sapi.h" +#include "classes.h" #include "pa_common.h" +#include "pa_request.h" +#include "pa_socks.h" +#include "pa_version.h" +#include "pool_storage.h" #ifdef WIN32 -// TODO: LONG WINAPI TopLevelExceptionFilter ( +# include +# include "getopt.h" +#else +# include #endif -int main(int argc, char *argv[]) { +//#define DEBUG_POOL_MALLOC +//#define DEBUG_STRING_APPENDS_VS_EXPANDS +//#define DEBUG_MAILRECEIVE "mailreceive.eml" + +#ifdef DEBUG_STRING_APPENDS_VS_EXPANDS +extern ulong + string_piece_appends, + wcontext_result_size, + total_alloc_size, + string_string_shortcut_economy; +#endif + +// consts + +#define REDIRECT_PREFIX "REDIRECT_" +#define PARSER_CONFIG_ENV_NAME "CGI_PARSER_CONFIG" + +/// IIS refuses to read bigger chunks +const size_t READ_POST_CHUNK_SIZE=0x400*0x400; // 1M + +static const char *argv0; +static const char *config_filespec_cstr=0; +static bool fail_on_config_read_problem=true; + +static Pool_storage global_pool_storage; ///< global pool storage +static Pool global_pool(&global_pool_storage); ///< global pool +static bool cgi; ///< we were started as CGI? +static bool mail_received=false; ///< we were started with -m option? [asked to parse incoming message to $mail:received] + +// for signal handlers +Request *request=0; + +// SAPI + +static void log(const char *fmt, va_list args) { + bool opened=false; + FILE *f=0; + + if(config_filespec_cstr) { + char beside_config_path[MAX_STRING]; + strncpy(beside_config_path, config_filespec_cstr, MAX_STRING-1); beside_config_path[MAX_STRING-1]=0; + if(!( + rsplit(beside_config_path, '/') || + rsplit(beside_config_path, '\\'))) { // strip filename + // no path, just filename + beside_config_path[0]='.'; beside_config_path[1]=0; + } + + char file_spec[MAX_STRING]; + snprintf(file_spec, MAX_STRING, + "%s/parser3.log", beside_config_path); + f=fopen(file_spec, "at"); + opened=f!=0; + } + // fallback to stderr + if(!opened) + f=stderr; + + // prefix + time_t t=time(0); + if(const char *stamp=ctime(&t)) { // never saw that + if(size_t len=strlen(stamp)) // saw once stamp being ="" + fprintf(f, "[%.*s] ", len-1, stamp); + } + // message + + char buf[MAX_STRING]; + size_t size=vsnprintf(buf, MAX_STRING, fmt, args); + remove_crlf(buf, buf+size); + + fwrite(buf, size, 1, f); + // newline + fprintf(f, "\n"); + + if(opened) + fclose(f); + else + fflush(f); +} + +// appends to parser3.log located beside my binary if openable, to stderr otherwize +void SAPI::log(Pool& , const char *fmt, ...) { + va_list args; + va_start(args,fmt); + ::log(fmt, args); + va_end(args); +} + +void SAPI::die(const char *fmt, ...) { +#ifdef DEBUG_POOL_MALLOC + extern void log_pool_stats(Pool& pool); + log_pool_stats(global_pool); +#endif + + va_list args; + va_start(args,fmt); + // log + + // logging is more important than user + // she can cancel download, we'd get SIG_PIPE, + // nothing would be logged then + ::log(fmt, args); + + // inform user + + char body[MAX_STRING]; + int content_length=vsnprintf(body, MAX_STRING, fmt, args); + + va_end(args); + + // prepare header + // let's be honest, that's bad we couldn't produce valid output + SAPI::add_header_attribute(global_pool, "status", "500"); + SAPI::add_header_attribute(global_pool, "content-type", "text/plain"); + char content_length_cstr[MAX_NUMBER]; + snprintf(content_length_cstr, sizeof(content_length_cstr), "%u", content_length); + SAPI::add_header_attribute(global_pool, "content-length", content_length_cstr); + + // send header + SAPI::send_header(global_pool); + + // body + SAPI::send_body(global_pool, body, content_length); + + exit(1); +} + +const char *SAPI::get_env(Pool& , const char *name) { + return getenv(name); +} + +const char *const *SAPI::environment(Pool&) { +#ifdef _MSC_VER + extern char **_environ; + return _environ; +#else + extern char **environ; + return environ; +#endif +} + +size_t SAPI::read_post(Pool& , char *buf, size_t max_bytes) { + size_t read_size=0; + do { + ssize_t chunk_size=read(fileno(stdin), + buf+read_size, min(READ_POST_CHUNK_SIZE, max_bytes-read_size)); + if(chunk_size<=0) + break; + read_size+=chunk_size; + } while(read_size"); +} +#endif + +#ifdef SIGPIPE +void SIGPIPE_Handler(int /*sig*/){ + SAPI::log(global_pool, "SIGPIPE received. url=", request?request->info.uri:""); + if(request) + request->interrupt(); +} +#endif + +/** +main workhorse - //TODO: SetUnhandledExceptionFilter(&TopLevelExceptionFilter); - //TODO: initSocks(); + @todo + IIS: remove trailing default-document[index.html] from $request.uri. + to do that we need to consult metabase, + wich is tested but seems slow. + IIS5 todo find out proper 'illegal call' check +*/ +static void real_parser_handler( + const char *filespec_to_process, + const char *request_method, bool header_only) { + // init socks + init_socks(global_pool); + + // init global classes + init_methoded_array(global_pool); + // init global variables + pa_globals_init(global_pool); + + // request pool, must be different ptr from global [used in VStateless_class.add_method] + Pool request_pool(&global_pool_storage); + + if(!filespec_to_process || !*filespec_to_process) + SAPI::die("Parser/%s", PARSER_VERSION); + + // Request info + Request::Info request_info; + char document_root_buf[MAX_STRING]; + if(cgi) { + if(const char *env_document_root=SAPI::get_env(request_pool, "DOCUMENT_ROOT")) + request_info.document_root=env_document_root; + else if(const char *path_info=SAPI::get_env(request_pool, "PATH_INFO")) { + // IIS + size_t len=min(sizeof(document_root_buf)-1, strlen(filespec_to_process)-strlen(path_info)); + memcpy(document_root_buf, filespec_to_process, len); document_root_buf[len]=0; + request_info.document_root=document_root_buf; + } else + throw Exception("parser.runtime", + 0, + "CGI: no PATH_INFO defined(in reinventing DOCUMENT_ROOT)"); + } else { + full_file_spec("", document_root_buf, sizeof(document_root_buf)); + request_info.document_root=document_root_buf; + } + request_info.path_translated=filespec_to_process; + request_info.method=request_method ? request_method : "GET"; + const char *query_string=SAPI::get_env(request_pool, "QUERY_STRING"); + request_info.query_string=query_string; + if(cgi) { + if(const char *env_request_uri=SAPI::get_env(request_pool, "REQUEST_URI")) + request_info.uri=env_request_uri; + else if(const char *path_info=SAPI::get_env(request_pool, "PATH_INFO")) + if(query_string) { + char *reconstructed_uri=(char *)request_pool.malloc( + strlen(path_info)+1/*'?'*/+ + strlen(query_string)+1/*0*/); + strcpy(reconstructed_uri, path_info); + strcat(reconstructed_uri, "?"); + strcat(reconstructed_uri, query_string); + request_info.uri=reconstructed_uri; + } else + request_info.uri=path_info; + else + throw Exception("parser.runtime", + 0, + "CGI: no PATH_INFO defined(in reinventing REQUEST_URI)"); + + // they've changed this under IIS5. + if(const char *script_name=SAPI::get_env(request_pool, "SCRIPT_NAME")) { + size_t script_name_len=strlen(script_name); + size_t uri_len=strlen(request_info.uri); + if(strncmp(request_info.uri,script_name, script_name_len)==0 && + script_name_len != uri_len) // under IIS they are the same + SAPI::die("CGI: illegal call"); + } + } else + request_info.uri=""; + + request_info.content_type=SAPI::get_env(request_pool, "CONTENT_TYPE"); + const char *content_length=SAPI::get_env(request_pool, "CONTENT_LENGTH"); + request_info.content_length=(content_length?atoi(content_length):0); + request_info.cookie=SAPI::get_env(request_pool, "HTTP_COOKIE"); + request_info.mail_received=mail_received; + + + // prepare to process request + Request request(request_pool, + request_info, +/*#ifdef _DEBUG + String::UL_HTML|String::UL_OPTIMIZE_BIT +#else*/ + cgi ? String::UL_HTML|String::UL_OPTIMIZE_BIT : String::UL_AS_IS +/*#endif*/ + , + true /* status_allowed */); + + // get request ptr for signal handlers + ::request=&request; +#ifdef SIGUSR1 + if(signal(SIGUSR1, SIGUSR1_Handler)==SIG_ERR) + SAPI::die("Can not set handler for SIGUSR1"); +#endif +#ifdef SIGPIPE + if(signal(SIGPIPE, SIGPIPE_Handler)==SIG_ERR) + SAPI::die("Can not set handler for SIGPIPE"); #endif + char config_filespec_buf[MAX_STRING]; + if(!config_filespec_cstr) { + const char *config_by_env=getenv(PARSER_CONFIG_ENV_NAME); + if(!config_by_env) + config_by_env=getenv(REDIRECT_PREFIX PARSER_CONFIG_ENV_NAME); + if(config_by_env) + config_filespec_cstr=config_by_env; + else { + // beside by binary + char beside_binary_path[MAX_STRING]; + strncpy(beside_binary_path, argv0, MAX_STRING-1); beside_binary_path[MAX_STRING-1]=0; // filespec of my binary + if(!( + rsplit(beside_binary_path, '/') || + rsplit(beside_binary_path, '\\'))) { // strip filename + // no path, just filename + // @todo full path, not ./! + beside_binary_path[0]='.'; beside_binary_path[1]=0; + } + snprintf(config_filespec_buf, MAX_STRING, + "%s/%s", + beside_binary_path, AUTO_FILE_NAME); + config_filespec_cstr=config_filespec_buf; + fail_on_config_read_problem=entry_exists(config_filespec_cstr); + } + } + + // process the request + request.core( + config_filespec_cstr, fail_on_config_read_problem, + header_only); + + // no request [prevent signal handlers from accessing invalid memory] + ::request=0; - Pool pool; - core(pool); + // + done_socks(); + +#ifdef DEBUG_POOL_MALLOC + extern void log_pool_stats(Pool& pool); + log_pool_stats(request_pool); +#endif + +#ifdef DEBUG_STRING_APPENDS_VS_EXPANDS + SAPI::log(global_pool, + "string piece appends=%lu, wcontext_result_size=%lu, string_string_shortcut_economy_closer=%lu, total_alloc_size=%lu", + string_piece_appends, + wcontext_result_size, + string_string_shortcut_economy, + total_alloc_size); +#endif + +} + +static void call_real_parser_handler__do_SEH( + const char *filespec_to_process, + const char *request_method, bool header_only) { +#if _MSC_VER && !defined(_DEBUG) + LPEXCEPTION_POINTERS system_exception=0; + __try { +#endif + real_parser_handler( + filespec_to_process, + request_method, header_only); + +#if _MSC_VER && !defined(_DEBUG) + } __except ( + (system_exception=GetExceptionInformation()), + EXCEPTION_EXECUTE_HANDLER) { + + if(system_exception) + if(_EXCEPTION_RECORD *er=system_exception->ExceptionRecord) + throw Exception(0, + 0, + "Exception 0x%08X at 0x%08X", er->ExceptionCode, er->ExceptionAddress); + else + throw Exception(0, 0, "Exception "); + else + throw Exception(0, 0, "Exception "); + } +#endif +} + +#if _MSC_VER +int failed_new(size_t size) { + SAPI::die("out of memory in 'new', failed to allocated %u bytes", size); + return 0; // not reached +} +#endif + +#ifdef HAVE_SET_NEW_HANDLER +static void failed_new() { + SAPI::die("out of memory in 'new'"); +} +#endif + +static void usage(const char *program) { + printf( + "Parser/%s Copyright(c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com)\n" + "Author: Alexandr Petrosian (http://paf.design.ru)\n" + "\n" + "Usage: %s [options] file\n" + "Options are:\n" +#ifdef WITH_MAILRECEIVE + " -m Parse mail, put received letter to $mail:received\n" +#endif + " -f config_file Use this config file (/path/to/auto.p)\n" + " -h Display usage information (this message)\n" + , PARSER_VERSION, + program); + exit(EINVAL); +} + +int main(int argc, char *argv[]) { +#ifdef DEBUG_MAILRECEIVE + if(FILE *fake_in=fopen(DEBUG_MAILRECEIVE, "rt")) { + dup2(fake_in->_file, 0/*STDIN_FILENO*/); + } +#endif + +#ifdef _DEBUG +// _crtBreakAlloc=33112; +#endif +// _asm int 3; + argv0=argv[0]; + + umask(2); // were we started as CGI? - bool cgi= + cgi= getenv("SERVER_SOFTWARE") || getenv("SERVER_NAME") || getenv("GATEWAY_INTERFACE") || getenv("REQUEST_METHOD"); + + char *raw_filespec_to_process; + if(cgi) + raw_filespec_to_process=getenv("PATH_TRANSLATED"); + else { + optind = 1; + opterr = 0; + int c; + while((c = getopt(argc, argv, "hf:" +#ifdef WITH_MAILRECEIVE + "m" +#endif + )) > 0) { + switch (c) { + case 'h': + usage(argv[0]); + break; + case 'f': + config_filespec_cstr=optarg; + break; +#ifdef WITH_MAILRECEIVE + case 'm': + mail_received=true; + break; +#endif + default: + fprintf(stderr, "%s: invalid option '%c'\n", argv[0], optopt); + usage(argv[0]); + break; + } + } + if (optind != argc - 1) { + fprintf(stderr, "%s: file not specified\n", argv[0]); + usage(argv[0]); + } + + raw_filespec_to_process=argv[optind++]; + } - // TODO: ifdef WIN32 flip \\ to / - const char *document_root="Y:/parser3/src/"; - const char *page_filespec="Y:/parser3/src/test.p"; - - // request - Request request(pool, - cgi ? String::Untaint_lang::HTML_TYPO : String::Untaint_lang::NO, - document_root, - page_filespec - ); - - bool error; - // some root-controlled location - char *sys_auto_path1; #ifdef WIN32 - sys_auto_path1=(char *)pool.malloc(MAX_STRING); - GetWindowsDirectory(sys_auto_path1, MAX_STRING-1/*for \*/); - strcat(sys_auto_path1, '\\'); -#else - sys_auto_path1=getenv("HOME"); + setmode(fileno(stdin), _O_BINARY); + setmode(fileno(stdout), _O_BINARY); + setmode(fileno(stderr), _O_BINARY); #endif + +#if _MSC_VER + _set_new_handler(failed_new); + +#ifdef _DEBUG + // Get current flag + int tmpFlag = _CrtSetDbgFlag( _CRTDBG_REPORT_FLAG ); + + // Turn on leak-checking bit + tmpFlag |= _CRTDBG_LEAK_CHECK_DF; + + // Set flag to the new value + _CrtSetDbgFlag( tmpFlag ); +// _CrtSetBreakAlloc(471); + +#endif + +#endif + +#ifdef HAVE_SET_NEW_HANDLER + std::set_new_handler(failed_new); +#endif + + char filespec_to_process[MAX_STRING]; + full_file_spec(raw_filespec_to_process, filespec_to_process, sizeof(filespec_to_process)); + + const char *request_method=getenv("REQUEST_METHOD"); + bool header_only=request_method && strcasecmp(request_method, "HEAD")==0; + + try { // global try + call_real_parser_handler__do_SEH( + filespec_to_process, + request_method, header_only); + } catch(const Exception& e) { // global problem + // don't allocate anything on pool here: + // possible pool' exception not catch-ed now + // and there could be out-of-memory exception + + SAPI::die("exception in request exception handler: %s", e.comment()); +#ifndef _DEBUG + } catch(...) { + SAPI::die(""); +#endif + } - // beside by binary - const char *sys_auto_path2=(char *)pool.malloc(MAX_STRING); - strncpy(sys_auto_path2, argv[0]); // filespec of my binary - rsplit(sys_auto_path2, '\\'); rsplit(sys_auto_path2, '/'); // strip filename - - char *result=request.core( - sys_auto_path1, - sys_auto_path2); - - if(cgi) { - const char *content_type="text/html"; - printf( - "Content-type: %s\n" - "Content-length: %d\n" - "\n", - content_type, - strlen(result)); - stdout_write(result); - } else - printf("%s", result); +#ifndef WIN32 + // + if(!cgi) + SAPI::send_body(global_pool, "\n", 1); +#endif +//_asm int 3; return 0; }