Annotation of parser3/src/targets/cgi/parser3.C, revision 1.194
1.27 paf 1: /** @file
2: Parser: scripting and CGI main.
3:
1.155 paf 4: Copyright(c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com)
1.154 paf 5: Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru)
1.189 paf 6: */
1.27 paf 7:
1.194 ! paf 8: static const char* IDENT_PARSER3_C="$Date: 2002/08/14 10:52:28 $";
1.1 paf 9:
1.40 paf 10: #include "pa_config_includes.h"
1.3 paf 11:
1.139 paf 12: #if _MSC_VER
1.131 paf 13: # include <new.h>
1.148 paf 14: # include <crtdbg.h>
1.3 paf 15: #endif
1.27 paf 16:
1.37 paf 17: #include "pa_sapi.h"
1.76 paf 18: #include "classes.h"
1.24 paf 19: #include "pa_common.h"
1.2 paf 20: #include "pa_request.h"
1.57 paf 21: #include "pa_socks.h"
1.68 paf 22: #include "pa_version.h"
1.125 parser 23: #include "pool_storage.h"
1.69 paf 24:
1.149 paf 25: #ifdef WIN32
26: # include <windows.h>
1.184 paf 27: # include "getopt.h"
28: #else
29: # include <getopt.h>
1.120 parser 30: #endif
31:
1.194 ! paf 32: #include "fixopt.h"
! 33:
1.158 paf 34: //#define DEBUG_POOL_MALLOC
1.162 paf 35: //#define DEBUG_STRING_APPENDS_VS_EXPANDS
1.191 paf 36: //#define DEBUG_MAILRECEIVE "test.eml"
1.160 paf 37:
#ifdef DEBUG_STRING_APPENDS_VS_EXPANDS
// statistics counters defined elsewhere; reported at the end of real_parser_handler
extern ulong string_piece_appends;
extern ulong wcontext_result_size;
extern ulong total_alloc_size;
extern ulong string_string_shortcut_economy;
#endif
1.84 parser 45:
1.109 parser 46: // consts
1.84 parser 47:
1.175 paf 48: #define REDIRECT_PREFIX "REDIRECT_"
1.181 paf 49: #define PARSER_CONFIG_ENV_NAME "CGI_PARSER_CONFIG"
1.159 paf 50:
1.42 paf 51: /// IIS refuses to read bigger chunks
52: const size_t READ_POST_CHUNK_SIZE=0x400*0x400; // 1M
53:
1.184 paf 54: static const char *argv0;
1.193 paf 55: static const char *config_filespec_cstr=0;
56: static bool fail_on_config_read_problem=true;
1.192 paf 57:
1.184 paf 58: static Pool *pool; // global pool [dont describe to doxygen: it confuses it with param names]
59: static bool cgi; ///< we were started as CGI?
60: static bool mail_received=false; ///< we were started with -m option? [asked to parse incoming message to $mail:received]
1.5 paf 61:
1.46 paf 62: // SAPI
1.86 parser 63:
1.124 parser 64: static void log(const char *fmt, va_list args) {
1.193 paf 65: bool opened=false;
1.61 paf 66: FILE *f=0;
67:
1.193 paf 68: if(config_filespec_cstr) {
69: char beside_config_path[MAX_STRING];
70: strncpy(beside_config_path, config_filespec_cstr, MAX_STRING-1); beside_config_path[MAX_STRING-1]=0;
71: if(!(
72: rsplit(beside_config_path, '/') ||
73: rsplit(beside_config_path, '\\'))) { // strip filename
74: // no path, just filename
75: beside_config_path[0]='.'; beside_config_path[1]=0;
76: }
77:
78: char file_spec[MAX_STRING];
79: snprintf(file_spec, MAX_STRING,
80: "%s/parser3.log", beside_config_path);
81: f=fopen(file_spec, "at");
82: opened=f!=0;
83: }
1.192 paf 84: // fallback to stderr
1.61 paf 85: if(!opened)
86: f=stderr;
87:
88: // prefix
89: time_t t=time(0);
1.171 paf 90: if(const char *stamp=ctime(&t)) { // never saw that
1.173 paf 91: if(size_t len=strlen(stamp)) // saw once stamp being =""
1.172 paf 92: fprintf(f, "[%.*s] ", len-1, stamp);
1.171 paf 93: }
1.61 paf 94: // message
1.117 parser 95:
96: char buf[MAX_STRING];
97: size_t size=vsnprintf(buf, MAX_STRING, fmt, args);
98: remove_crlf(buf, buf+size);
99:
100: fwrite(buf, size, 1, f);
1.61 paf 101: // newline
102: fprintf(f, "\n");
103:
104: if(opened)
105: fclose(f);
1.85 parser 106: else
107: fflush(f);
1.124 parser 108: }
109:
110: // appends to parser3.log located beside my binary if openable, to stderr otherwize
111: void SAPI::log(Pool& , const char *fmt, ...) {
112: va_list args;
113: va_start(args,fmt);
114: ::log(fmt, args);
115: va_end(args);
116: }
117:
118: void SAPI::die(const char *fmt, ...) {
1.137 paf 119: #ifdef DEBUG_POOL_MALLOC
120: extern void log_pool_stats(Pool& pool);
1.178 paf 121: log_pool_stats(*pool);
1.137 paf 122: #endif
123:
1.144 paf 124: va_list args;
125: va_start(args,fmt);
1.138 paf 126: // log
127:
128: // logging is more important than user
129: // she can cancel download, we'd get SIG_PIPE,
130: // nothing would be logged then
1.124 parser 131: ::log(fmt, args);
132:
1.138 paf 133: // inform user
134:
1.134 paf 135: char body[MAX_STRING];
1.138 paf 136: int content_length=vsnprintf(body, MAX_STRING, fmt, args);
1.134 paf 137:
1.144 paf 138: va_end(args);
139:
1.134 paf 140: // prepare header
141: // let's be honest, that's bad we couldn't produce valid output
1.178 paf 142: SAPI::add_header_attribute(*pool, "status", "500");
143: SAPI::add_header_attribute(*pool, "content-type", "text/plain");
1.134 paf 144: char content_length_cstr[MAX_NUMBER];
1.168 paf 145: snprintf(content_length_cstr, sizeof(content_length_cstr), "%u", content_length);
1.178 paf 146: SAPI::add_header_attribute(*pool, "content-length", content_length_cstr);
1.134 paf 147:
148: // send header
1.178 paf 149: SAPI::send_header(*pool);
1.134 paf 150:
151: // body
1.178 paf 152: SAPI::send_body(*pool, body, content_length);
1.134 paf 153:
1.124 parser 154: exit(1);
1.61 paf 155: }
156:
1.122 parser 157: const char *SAPI::get_env(Pool& , const char *name) {
1.109 parser 158: return getenv(name);
1.28 paf 159: }
160:
1.180 paf 161: const char *const *SAPI::environment(Pool&) {
162: #ifdef _MSC_VER
163: extern char **_environ;
164: return _environ;
165: #else
166: extern char **environ;
167: return environ;
168: #endif
169: }
170:
1.122 parser 171: size_t SAPI::read_post(Pool& , char *buf, size_t max_bytes) {
1.59 paf 172: size_t read_size=0;
1.12 paf 173: do {
1.36 paf 174: int chunk_size=read(fileno(stdin),
1.42 paf 175: buf+read_size, min(READ_POST_CHUNK_SIZE, max_bytes-read_size));
1.129 paf 176: if(chunk_size<=0)
1.12 paf 177: break;
178: read_size+=chunk_size;
179: } while(read_size<max_bytes);
180:
181: return read_size;
1.10 paf 182: }
183:
1.122 parser 184: void SAPI::add_header_attribute(Pool& , const char *key, const char *value) {
1.68 paf 185: if(cgi)
1.20 paf 186: printf("%s: %s\n", key, value);
1.19 paf 187: }
188:
1.56 paf 189: /// @todo intelligent cache-control
1.122 parser 190: void SAPI::send_header(Pool& ) {
1.33 paf 191: if(cgi) {
1.147 paf 192: // puts("expires: Fri, 23 Mar 2001 09:32:23 GMT");
1.33 paf 193:
194: // header | body delimiter
1.20 paf 195: puts("");
1.33 paf 196: }
1.30 paf 197: }
1.20 paf 198:
1.122 parser 199: void SAPI::send_body(Pool& , const void *buf, size_t size) {
1.19 paf 200: stdout_write(buf, size);
1.58 paf 201: }
202:
1.97 parser 203: //
204:
/**
	Builds a full file spec for @a file_name in @a buf.

	- null @a file_name yields an empty string;
	- a name starting with '/' (under WIN32 also one with ':' in second position)
	  is copied as is;
	- anything else is prefixed with the current directory and '/'.

	The result is always zero-terminated and truncated to fit @a buf_size.
	If the current directory can not be determined (or does not fit into @a buf),
	"." is used instead of it.

	@param file_name name to expand, may be null
	@param buf receives the result
	@param buf_size size of @a buf in bytes; nothing is written when it is 0
*/
static void full_file_spec(const char *file_name, char *buf, size_t buf_size) {
	if(!buf || !buf_size)
		return;

	if(!file_name)
		buf[0]=0;
	else if(file_name[0]=='/'
#ifdef WIN32
		|| (file_name[0] && file_name[1]==':')
#endif
		) {
		// strncpy alone leaves the buffer unterminated when the name does not fit
		strncpy(buf, file_name, buf_size-1);
		buf[buf_size-1]=0;
	} else {
		if(!getcwd(buf, buf_size)) {
			// contents of buf are undefined after a failure
			buf[0]=0;
			if(buf_size>1) {
				buf[0]='.'; buf[1]=0;
			}
		}
		size_t cwd_len=strlen(buf);
		// cwd_len<=buf_size-1, so at least the terminator always fits
		snprintf(buf+cwd_len, buf_size-cwd_len, "/%s", file_name);
	}
#ifdef WIN32
	back_slashes_to_slashes(buf);
#endif
}
223:
1.40 paf 224: /**
1.122 parser 225: main workhorse
1.19 paf 226:
1.122 parser 227: @todo
1.40 paf 228: IIS: remove trailing default-document[index.html] from $request.uri.
229: to do that we need to consult metabase,
230: wich is tested but seems slow.
1.144 paf 231: IIS5 todo find out proper 'illegal call' check
1.40 paf 232: */
1.184 paf 233: static void real_parser_handler(
1.122 parser 234: const char *filespec_to_process,
235: const char *request_method, bool header_only) {
236: // init socks
1.178 paf 237: init_socks(*pool);
1.122 parser 238:
239: // init global classes
1.178 paf 240: init_methoded_array(*pool);
1.122 parser 241: // init global variables
1.178 paf 242: pa_globals_init(*pool);
1.122 parser 243:
1.186 paf 244: if(!filespec_to_process || !*filespec_to_process)
1.144 paf 245: SAPI::die("Parser/%s", PARSER_VERSION);
1.122 parser 246:
247: // Request info
248: Request::Info request_info;
1.166 paf 249: char document_root_buf[MAX_STRING];
1.122 parser 250: if(cgi) {
1.178 paf 251: if(const char *env_document_root=SAPI::get_env(*pool, "DOCUMENT_ROOT"))
1.122 parser 252: request_info.document_root=env_document_root;
1.178 paf 253: else if(const char *path_info=SAPI::get_env(*pool, "PATH_INFO")) {
1.122 parser 254: // IIS
1.166 paf 255: size_t len=min(sizeof(document_root_buf)-1, strlen(filespec_to_process)-strlen(path_info));
256: memcpy(document_root_buf, filespec_to_process, len); document_root_buf[len]=0;
257: request_info.document_root=document_root_buf;
1.122 parser 258: } else
1.165 paf 259: throw Exception("parser.runtime",
260: 0,
261: "CGI: no PATH_INFO defined(in reinventing DOCUMENT_ROOT)");
1.122 parser 262: } else {
1.166 paf 263: full_file_spec("", document_root_buf, sizeof(document_root_buf));
264: request_info.document_root=document_root_buf;
1.122 parser 265: }
266: request_info.path_translated=filespec_to_process;
267: request_info.method=request_method ? request_method : "GET";
1.178 paf 268: const char *query_string=SAPI::get_env(*pool, "QUERY_STRING");
1.122 parser 269: request_info.query_string=query_string;
270: if(cgi) {
1.178 paf 271: if(const char *env_request_uri=SAPI::get_env(*pool, "REQUEST_URI"))
1.122 parser 272: request_info.uri=env_request_uri;
1.178 paf 273: else if(const char *path_info=SAPI::get_env(*pool, "PATH_INFO"))
1.122 parser 274: if(query_string) {
1.178 paf 275: char *reconstructed_uri=(char *)pool->malloc(
1.122 parser 276: strlen(path_info)+1/*'?'*/+
277: strlen(query_string)+1/*0*/);
278: strcpy(reconstructed_uri, path_info);
279: strcat(reconstructed_uri, "?");
280: strcat(reconstructed_uri, query_string);
281: request_info.uri=reconstructed_uri;
282: } else
283: request_info.uri=path_info;
1.179 paf 284: else
285: throw Exception("parser.runtime",
286: 0,
287: "CGI: no PATH_INFO defined(in reinventing REQUEST_URI)");
1.145 paf 288:
289: #ifndef WIN32
290: // they've changed this under IIS5.
1.178 paf 291: if(const char *script_name=SAPI::get_env(*pool, "SCRIPT_NAME")) {
1.122 parser 292: size_t script_name_len=strlen(script_name);
293: size_t uri_len=strlen(request_info.uri);
294: if(strncmp(request_info.uri,script_name, script_name_len)==0 &&
295: script_name_len != uri_len) // under IIS they are the same
1.144 paf 296: SAPI::die("CGI: illegal call");
1.122 parser 297: }
1.145 paf 298: #endif
1.122 parser 299: } else
1.177 paf 300: request_info.uri="";
1.122 parser 301:
1.178 paf 302: request_info.content_type=SAPI::get_env(*pool, "CONTENT_TYPE");
303: const char *content_length=SAPI::get_env(*pool, "CONTENT_LENGTH");
1.122 parser 304: request_info.content_length=(content_length?atoi(content_length):0);
1.178 paf 305: request_info.cookie=SAPI::get_env(*pool, "HTTP_COOKIE");
1.184 paf 306: request_info.mail_received=mail_received;
307:
1.122 parser 308: // prepare to process request
1.178 paf 309: Request request(*pool,
1.122 parser 310: request_info,
1.184 paf 311: /*#ifdef _DEBUG
1.143 paf 312: String::UL_HTML|String::UL_OPTIMIZE_BIT
1.184 paf 313: #else*/
1.143 paf 314: cgi ? String::UL_HTML|String::UL_OPTIMIZE_BIT : String::UL_AS_IS
1.184 paf 315: /*#endif*/
1.143 paf 316: ,
1.130 paf 317: true /* status_allowed */);
1.122 parser 318:
1.181 paf 319: char config_filespec_buf[MAX_STRING];
1.193 paf 320: if(!config_filespec_cstr) {
321: const char *config_by_env=getenv(PARSER_CONFIG_ENV_NAME);
322: if(!config_by_env)
323: config_by_env=getenv(REDIRECT_PREFIX PARSER_CONFIG_ENV_NAME);
324: if(config_by_env)
325: config_filespec_cstr=config_by_env;
326: else {
327: // beside by binary
328: char beside_binary_path[MAX_STRING];
329: strncpy(beside_binary_path, argv0, MAX_STRING-1); beside_binary_path[MAX_STRING-1]=0; // filespec of my binary
330: if(!(
331: rsplit(beside_binary_path, '/') ||
332: rsplit(beside_binary_path, '\\'))) { // strip filename
333: // no path, just filename
334: // @todo full path, not ./!
335: beside_binary_path[0]='.'; beside_binary_path[1]=0;
336: }
337: snprintf(config_filespec_buf, MAX_STRING,
338: "%s/%s",
339: beside_binary_path, AUTO_FILE_NAME);
340: config_filespec_cstr=config_filespec_buf;
341: fail_on_config_read_problem=false;
342: }
1.122 parser 343: }
344:
345: // process the request
346: request.core(
1.193 paf 347: config_filespec_cstr, fail_on_config_read_problem,
1.122 parser 348: header_only);
349:
350: //
351: done_socks();
352:
353: #ifdef DEBUG_POOL_MALLOC
354: extern void log_pool_stats(Pool& pool);
1.178 paf 355: log_pool_stats(*pool);
1.122 parser 356: #endif
1.160 paf 357:
358: #ifdef DEBUG_STRING_APPENDS_VS_EXPANDS
1.178 paf 359: SAPI::log(*pool,
1.161 paf 360: "string piece appends=%lu, wcontext_result_size=%lu, string_string_shortcut_economy_closer=%lu, total_alloc_size=%lu",
1.160 paf 361: string_piece_appends,
362: wcontext_result_size,
363: string_string_shortcut_economy,
364: total_alloc_size);
365: #endif
366:
1.122 parser 367: }
368:
1.184 paf 369: static void call_real_parser_handler__do_SEH(
1.122 parser 370: const char *filespec_to_process,
371: const char *request_method, bool header_only) {
1.133 paf 372: #if _MSC_VER && !defined(_DEBUG)
1.122 parser 373: LPEXCEPTION_POINTERS system_exception=0;
374: __try {
375: #endif
376: real_parser_handler(
377: filespec_to_process,
378: request_method, header_only);
379:
1.133 paf 380: #if _MSC_VER && !defined(_DEBUG)
1.122 parser 381: } __except (
382: (system_exception=GetExceptionInformation()),
383: EXCEPTION_EXECUTE_HANDLER) {
384:
385: if(system_exception)
386: if(_EXCEPTION_RECORD *er=system_exception->ExceptionRecord)
1.165 paf 387: throw Exception(0,
388: 0,
389: "Exception 0x%08X at 0x%08X", er->ExceptionCode, er->ExceptionAddress);
1.122 parser 390: else
1.165 paf 391: throw Exception(0, 0, "Exception <no exception record>");
1.122 parser 392: else
1.165 paf 393: throw Exception(0, 0, "Exception <no exception information>");
1.122 parser 394: }
395: #endif
396: }
397:
#if _MSC_VER
/// Handler installed with _set_new_handler: reports the failed allocation size and dies
int failed_new(size_t size) {
	// size_t does not match "%u" where it is wider than unsigned int, hence the cast and "%lu"
	SAPI::die("out of memory in 'new', failed to allocated %lu bytes", (unsigned long)size);
	return 0; // not reached
}
#endif
1.131 paf 404:
#ifdef HAVE_SET_NEW_HANDLER
/// Handler installed with std::set_new_handler: dies with an out-of-memory message
static void failed_new() {
	SAPI::die(
		"out of memory in 'new'");
}
#endif
410:
1.184 paf 411: static void usage(const char *program) {
1.188 paf 412: printf(
1.184 paf 413: "Parser/%s Copyright(c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com)\n"
414: "Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru)\n"
415: "\n"
416: "Usage: %s [options] file\n"
417: "Options are:\n"
1.185 paf 418: #ifdef WITH_MAILRECEIVE
1.193 paf 419: " -m Parse mail, put received letter to $mail:received\n"
1.184 paf 420: #endif
1.193 paf 421: " -f config_file Use this config file (/path/to/auto.p)\n"
422: " -h Display usage information (this message)\n"
1.184 paf 423: , PARSER_VERSION,
424: program);
425: exit(EINVAL);
426: }
427:
1.194 ! paf 428: int main(int raw_argc, char *raw_argv[]) {
! 429: int argc;
! 430: char **argv;
! 431: fixopt(
! 432: raw_argc, raw_argv,
! 433: argc, argv);
! 434:
1.178 paf 435: Pool_storage global_pool_storage;
436: Pool global_pool(&global_pool_storage);
437: pool=&global_pool;
438:
1.185 paf 439: #ifdef DEBUG_MAILRECEIVE
440: if(FILE *fake_in=fopen(DEBUG_MAILRECEIVE, "rt")) {
1.184 paf 441: dup2(fake_in->_file, 0/*STDIN_FILENO*/);
442: }
443: #endif
444:
1.178 paf 445: #ifdef _DEBUG
446: // _crtBreakAlloc=33112;
447: #endif
1.144 paf 448: // _asm int 3;
1.193 paf 449: argv0=argv[0];
1.45 paf 450:
1.32 paf 451: umask(2);
452:
1.3 paf 453: // were we started as CGI?
1.146 paf 454: cgi=
1.109 parser 455: getenv("SERVER_SOFTWARE") ||
456: getenv("SERVER_NAME") ||
457: getenv("GATEWAY_INTERFACE") ||
458: getenv("REQUEST_METHOD");
1.5 paf 459:
1.184 paf 460: char *raw_filespec_to_process;
461: if(cgi)
462: raw_filespec_to_process=getenv("PATH_TRANSLATED");
463: else {
464: optind = 1;
465: opterr = 0;
466: int c;
1.193 paf 467: while((c = getopt(argc, argv, "hf:"
1.185 paf 468: #ifdef WITH_MAILRECEIVE
1.184 paf 469: "m"
470: #endif
471: )) > 0) {
472: switch (c) {
473: case 'h':
474: usage(argv[0]);
1.193 paf 475: break;
476: case 'f':
477: config_filespec_cstr=optarg;
1.184 paf 478: break;
1.185 paf 479: #ifdef WITH_MAILRECEIVE
1.184 paf 480: case 'm':
481: mail_received=true;
482: break;
483: #endif
484: default:
485: fprintf(stderr, "%s: invalid option '%c'\n", argv[0], optopt);
486: usage(argv[0]);
487: break;
488: }
489: }
490: if (optind != argc - 1) {
491: fprintf(stderr, "%s: file not specified\n", argv[0]);
492: usage(argv[0]);
1.10 paf 493: }
1.184 paf 494:
495: raw_filespec_to_process=argv[optind++];
1.10 paf 496: }
497:
1.100 parser 498: #ifdef WIN32
499: setmode(fileno(stdin), _O_BINARY);
500: setmode(fileno(stdout), _O_BINARY);
501: setmode(fileno(stderr), _O_BINARY);
502: #endif
503:
1.139 paf 504: #if _MSC_VER
1.138 paf 505: _set_new_handler(failed_new);
1.148 paf 506:
507: #ifdef _DEBUG
508: // Get current flag
509: int tmpFlag = _CrtSetDbgFlag( _CRTDBG_REPORT_FLAG );
510:
511: // Turn on leak-checking bit
512: tmpFlag |= _CRTDBG_LEAK_CHECK_DF;
513:
514: // Set flag to the new value
515: _CrtSetDbgFlag( tmpFlag );
516: // _CrtSetBreakAlloc(471);
517:
518: #endif
519:
1.138 paf 520: #endif
521:
522: #ifdef HAVE_SET_NEW_HANDLER
523: std::set_new_handler(failed_new);
524: #endif
525:
1.166 paf 526: char filespec_to_process[MAX_STRING];
527: full_file_spec(raw_filespec_to_process, filespec_to_process, sizeof(filespec_to_process));
1.10 paf 528:
1.109 parser 529: const char *request_method=getenv("REQUEST_METHOD");
1.35 paf 530: bool header_only=request_method && strcasecmp(request_method, "HEAD")==0;
1.131 paf 531:
1.122 parser 532: try { // global try
533: call_real_parser_handler__do_SEH(
534: filespec_to_process,
535: request_method, header_only);
536: } catch(const Exception& e) { // global problem
1.44 paf 537: // don't allocate anything on pool here:
538: // possible pool' exception not catch-ed now
539: // and there could be out-of-memory exception
1.43 paf 540:
1.144 paf 541: SAPI::die("exception in request exception handler: %s", e.comment());
1.134 paf 542: #ifndef _DEBUG
1.131 paf 543: } catch(...) {
1.134 paf 544: SAPI::die("<unknown exception>");
1.133 paf 545: #endif
1.16 paf 546: }
1.122 parser 547:
1.109 parser 548:
549: #ifndef WIN32
550: //
551: if(!cgi)
1.178 paf 552: SAPI::send_body(*pool, "\n", 1);
1.109 parser 553: #endif
1.156 paf 554: //_asm int 3;
1.134 paf 555: return 0;
1.1 paf 556: }
E-mail: