Annotation of parser3/src/main/pa_globals.C, revision 1.137

1.15      paf         1: /** @file
1.16      paf         2:        Parser: globals.
                      3: 
1.112     paf         4:        Copyright (c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com)
1.113     paf         5:        Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru)
1.133     paf         6: */
1.16      paf         7: 
1.137   ! paf         8: static const char* IDENT_GLOBALS_C="$Date: 2002/08/06 09:07:59 $";
1.1       paf         9: 
1.102     paf        10: #include "pa_config_includes.h"
                     11: 
                     12: #ifdef XML
                     13: #include "libxslt/extensions.h"
                     14: #include "libxslt/xsltutils.h"
1.116     paf        15: extern "C" {
1.102     paf        16: #include "libexslt/exslt.h"
1.116     paf        17: };
1.102     paf        18: #endif
                     19: 
1.1       paf        20: #include "pa_globals.h"
1.32      paf        21: #include "pa_string.h"
                     22: #include "pa_hash.h"
1.42      paf        23: #include "pa_sql_driver_manager.h"
1.77      parser     24: #include "pa_dictionary.h"
1.100     paf        25: #include "pa_stylesheet_manager.h"
1.83      parser     26: #include "pa_sapi.h"
1.90      paf        27: #include "pa_cache_managers.h"
1.95      paf        28: #include "pa_charsets.h"
                     29: #include "pa_charset.h"
1.101     paf        30: #include "pa_threads.h"
1.84      parser     31: 
// Shared String constants.
// Every pointer in this group that pa_globals_init() assigns is allocated from the
// pool there, from the like-named upper-case *_NAME macro.
1.8       paf        32: String *content_type_name;
1.75      parser     33: String *charset_name;
1.8       paf        34: String *body_name;
1.13      paf        35: String *value_name;
1.14      paf        36: String *expires_name;
                     37: String *path_name;
1.17      paf        38: String *name_name;
                     39: String *size_name;
                     40: String *text_name;
1.8       paf        41: 
1.39      paf        42: String *content_disposition_name;
                     43: String *content_disposition_filename_name;
                     44: 
1.130     paf        45: String *conf_method_name;
1.1       paf        46: String *auto_method_name;
                     47: 
                     48: String *main_class_name;
                     49: 
1.6       paf        50: String *result_var_name;
1.64      parser     51: String *match_var_name;
1.6       paf        52: 
1.119     paf        53: String *exception_var_name;
                     54: String *exception_type_part_name;
                     55: String *exception_source_part_name;
                     56: String *exception_comment_part_name;
                     57: String *exception_handled_part_name;
                     58: 
1.79      parser     59: String *charsets_name;
1.36      paf        60: String *mime_types_name;
// NOTE(review): pa_globals_init() in this file contains no assignment to
// vfile_mime_type_name -- confirm it is initialized elsewhere before use.
                     61: String *vfile_mime_type_name;
1.63      parser     62: String *origins_mode_name;
1.67      parser     63: 
1.69      parser     64: String *class_path_name;
                     65: 
1.67      parser     66: String *switch_data_name;
                     67: 
1.120     paf        68: String *cache_data_name;
                     69: 
1.70      parser     70: String *sql_limit_name;
                     71: String *sql_offset_name;
                     72: String *sql_default_name;
                     73: 
1.95      paf        74: String *charset_UTF8_name;
                     75: 
1.71      parser     76: String *hash_default_element_name;
1.42      paf        77: 
// Table built in pa_globals_init() with columns STRING_PRE_MATCH_NAME, STRING_MATCH_NAME,
// STRING_POST_MATCH_NAME, then "1" .. MAX_STRING_MATCH_TABLE_COLUMNS.
1.124     paf        78: Table *string_match_table_template;
1.123     paf        79: 
// Table built in pa_globals_init() with columns "0" .. "6", then
// DATE_CALENDAR_WEEKNO_NAME and DATE_CALENDAR_WEEKYEAR_NAME.
1.135     paf        80: Table *date_calendar_table_template;
                     81: 
// Filled in pa_globals_init(): maps a language name ("as-is", "uri", "html", ...)
// to the matching String::UL_* value stored as int.
1.1       paf        82: Hash *untaint_lang_name2enum;
                     83: 
// Created in pa_globals_init() and registered in `charsets` under *charset_UTF8_name.
1.95      paf        84: Charset *utf8_charset;
1.32      paf        85: 
/// value of each hexadecimal digit character, indexed by character code; filled by setup_hex_value()
short hex_value[0x100];

#ifdef XML
/// DOM implementation reference: taken in pa_globals_init(), released in pa_globals_destroy()
GdomeDOMImplementation *domimpl;
#endif

/**
	Fills the hex_value lookup table.

	'0'..'9' map to 0..9, 'A'..'F' and 'a'..'f' map to 10..15.
	Every other entry is 0, so a non-hex character cannot be told
	apart from '0' by looking at the table alone.
*/
static void setup_hex_value() {
	// everything that is not a hex digit stays zero
	memset(hex_value, 0, sizeof(hex_value));

	// decimal digits
	for(int digit=0; digit<10; digit++)
		hex_value['0'+digit]=(short)digit;

	// letters, both cases share the same values
	for(int extra=0; extra<6; extra++) {
		hex_value['A'+extra]=(short)(10+extra);
		hex_value['a'+extra]=(short)(10+extra);
	}
}
1.1       paf       117: 
1.99      paf       118: #ifdef XML
1.101     paf       119: 
                    120: const int MAX_CONCURRENT_XML_GENERIC_ERROR_THREADS=10;
                    121: 
                    122: struct XML_Generic_error_info {
                    123:        pa_thread_t thread_id;
                    124:        char *message;
                    125: } xml_generic_error_infos[MAX_CONCURRENT_XML_GENERIC_ERROR_THREADS];
                    126: 
                    127: XML_Generic_error_info *xml_generic_error_info(pa_thread_t thread_id) {
                    128:        for(int i=0; i<MAX_CONCURRENT_XML_GENERIC_ERROR_THREADS; i++) {
                    129:                XML_Generic_error_info *p=xml_generic_error_infos+i;
                    130:                if(p->thread_id==thread_id)
                    131:                        return p;
                    132:        }
                    133:        return 0;
                    134: }
                    135: 
1.99      paf       136: static void
1.101     paf       137: xmlParserGenericErrorFunc(void *ctx, const char *msg, ...) { 
                    138:     pa_thread_t thread_id=pa_get_thread_id();
                    139: 
                    140:        // infinitely looking for free slot to fill it
                    141:        while(true) {
                    142:                SYNCHRONIZED;  // find+fill blocked
                    143: 
                    144:                // first try to get existing for this thread_id
                    145:                XML_Generic_error_info *p=xml_generic_error_info(thread_id);
                    146:                if(!p) { // occupy empty one
                    147:                        p=xml_generic_error_info(0);
                    148:                        if(!p) // wait for empty for it to appear
                    149:                                continue;
                    150:                }
                    151: 
1.102     paf       152:                p->thread_id=thread_id;
1.101     paf       153:                size_t offset=p->message?strlen(p->message):0;
                    154:                p->message=(char *)realloc(p->message, offset+MAX_STRING);
                    155:                if(!p->message)
                    156:                        SAPI::die(
                    157:                                "out of memory in 'xmlParserGenericErrorFunc', failed to reallocate to %u bytes", 
                    158:                                offset+MAX_STRING);
                    159:                
                    160:                va_list args;
                    161:                va_start(args, msg);
                    162:                vsnprintf(p->message+offset, MAX_STRING, msg, args);
                    163:                va_end(args);
                    164: 
                    165:                break;
                    166:        }
                    167: }
                    168: 
1.102     paf       169: bool xmlHaveGenericErrors() {
                    170:     pa_thread_t thread_id=pa_get_thread_id();
                    171: 
                    172:        SYNCHRONIZED;  // find blocked
                    173: 
                    174:        return xml_generic_error_info(thread_id)!=0;
                    175: }
                    176: 
1.101     paf       177: const char *xmlGenericErrors() {
                    178:     pa_thread_t thread_id=pa_get_thread_id();
                    179: 
                    180:        SYNCHRONIZED;  // find+free blocked
                    181: 
                    182:        XML_Generic_error_info *p=xml_generic_error_info(thread_id);
                    183:        if(!p) // no errors for our thread_id registered
                    184:                return 0;
                    185: 
                    186:        const char *result=p->message;
                    187: 
                    188:        // free slot up 
                    189:        memset(p, 0, sizeof(*p));
                    190: 
                    191:        // it is up to caller to free it
                    192:        return result;
1.99      paf       193: }
1.110     paf       194: 
                    195: /**
                    196:  * xmlFileMatchWithLocalhostEqDocumentRoot:
                    197:  * filename:  the URI for matching
                    198:  *
                    199:  * check if the URI matches an HTTP one
                    200:  *
                    201:  * Returns 1 if matches, 0 otherwise
                    202:  */
                    203: static int
                    204: xmlFileMatchLocalhost(const char *filename) {
                    205:     if (!strncmp(filename, "http://localhost", 16))
                    206:        return(1);
                    207:     return(0);
                    208: }
                    209: 
                    210: 
                    211: /**
                    212:  * xmlFileOpenHttpLocalhost :
                    213:  * filename:  the URI for matching
                    214:  *
                    215:  * http://localhost/abc -> $ENV{DOCUMENT_ROOT}/abc | ./abc
                    216:  *
                    217:  * input from FILE *, supports compressed input
                    218:  * if filename is " " then the standard input is used
                    219:  *
                    220:  * Returns an I/O context or NULL in case of error
                    221:  */
                    222: static void *
                    223: xmlFileOpenLocalhost (const char *filename) {
                    224:     FILE *fd;
                    225:     const char* documentRoot;
                    226:     char path[1000];
                    227: 
                    228:        path[0]=0;
                    229:        strcat(path, (documentRoot=getenv("DOCUMENT_ROOT"))?documentRoot:".");
                    230:        strcat(path, &filename[16]);
                    231: 
                    232: #ifdef WIN32
                    233:     fd = fopen(path, "rb");
                    234: #else
                    235:     fd = fopen(path, "r");
                    236: #endif /* WIN32 */
                    237:     return((void *) fd);
                    238: }
                    239: 
                    240: /**
                    241:  * xmlFileRead:
                    242:  * @context:  the I/O context
                    243:  * @buffer:  where to drop data
                    244:  * @len:  number of bytes to write
                    245:  *
                    246:  * Read @len bytes to @buffer from the I/O channel.
                    247:  *
                    248:  * Returns the number of bytes written
                    249:  */
                    250: static int
                    251: xmlFileRead (void * context, char * buffer, int len) {
                    252:     return(fread(&buffer[0], 1,  len, (FILE *) context));
                    253: }
                    254: 
                    255: /**
                    256:  * xmlFileWrite:
                    257:  * @context:  the I/O context
                    258:  * @buffer:  where to drop data
                    259:  * @len:  number of bytes to write
                    260:  *
                    261:  * Write @len bytes from @buffer to the I/O channel.
                    262:  *
                    263:  * Returns the number of bytes written
                    264:  */
                    265: static int
                    266: xmlFileWrite (void * context, const char * buffer, int len) {
                    267:     return(fwrite(&buffer[0], 1,  len, (FILE *) context));
                    268: }
                    269: 
                    270: /**
                    271:  * xmlFileClose:
                    272:  * @context:  the I/O context
                    273:  *
                    274:  * Close an I/O channel
                    275:  */
                    276: static int
                    277: xmlFileClose (void * context) {
                    278:     return ( ( fclose((FILE *) context) == EOF ) ? -1 : 0 );
                    279: }
                    280: 
1.99      paf       281: #endif
                    282: 
1.83      parser    283: void pa_globals_destroy(void *) {
                    284:        try {
1.96      paf       285: #ifdef XML
                    286:                GdomeException exc;
                    287:                gdome_di_unref (domimpl, &exc);
                    288: #endif
1.93      paf       289:                if(cache_managers)
                    290:                        cache_managers->~Cache_managers();
1.95      paf       291: 
                    292:                charsets->~Charsets();
1.83      parser    293:                
                    294:        } catch(const Exception& e) {
                    295:                SAPI::die("pa_globals_destroy failed: %s", e.comment());
                    296:        }
                    297: }
                    298: 
/**
	One-time initialization of the parser globals defined in this file.

	In order: registers pa_globals_destroy as a cleanup on @a pool, fills the hex_value
	table, allocates the shared name Strings, fills untaint_lang_name2enum, builds the
	two table templates, creates the charsets registry with the UTF-8 charset, creates
	cache_managers and registers the SQL driver manager in it; in XML builds it then
	initializes gdome/libxml/libxslt, installs the error and input callbacks and
	registers the stylesheet manager.

	All objects are allocated with new(pool).
	The NEW and ULN macros defined inside stay defined after the function (there is no #undef).

	@param pool pool that owns every object created here
*/
1.108     paf       299: /// @test hint on one should call this for each thread xmlSubstituteEntitiesDefault(1);
1.27      paf       300: void pa_globals_init(Pool& pool) {
// registered first, so the cleanup may run even if initialization stops part-way
1.83      parser    301:        pool.register_cleanup(pa_globals_destroy, 0);
                    302: 
// from here on NEW allocates from `pool`
1.32      paf       303:        #undef NEW
                    304:        #define NEW new(pool)
                    305: 
1.5       paf       306:        // hex value
                    307:        setup_hex_value();
                    308: 
1.1       paf       309:        // names
1.32      paf       310:        content_type_name=NEW String(pool, CONTENT_TYPE_NAME);
1.75      parser    311:        charset_name=NEW String(pool, CHARSET_NAME);
1.32      paf       312:        body_name=NEW String(pool, BODY_NAME);
                    313:        value_name=NEW String(pool, VALUE_NAME);
                    314:        expires_name=NEW String(pool, EXPIRES_NAME);
                    315:        path_name=NEW String(pool, PATH_NAME);
                    316:        name_name=NEW String(pool, NAME_NAME);
                    317:        size_name=NEW String(pool, SIZE_NAME);
                    318:        text_name=NEW String(pool, TEXT_NAME);
                    319: 
1.39      paf       320:        content_disposition_name=NEW String(pool, CONTENT_DISPOSITION_NAME);
                    321:        content_disposition_filename_name=NEW String(pool, CONTENT_DISPOSITION_FILENAME_NAME);
1.32      paf       322: 
1.130     paf       323:        conf_method_name=NEW String(pool, CONF_METHOD_NAME);
1.32      paf       324:        auto_method_name=NEW String(pool, AUTO_METHOD_NAME);
                    325: 
                    326:        main_class_name=NEW String(pool, MAIN_CLASS_NAME);
1.6       paf       327: 
1.32      paf       328:        result_var_name=NEW String(pool, RESULT_VAR_NAME);
1.64      parser    329:        match_var_name=NEW String(pool, MATCH_VAR_NAME);
1.6       paf       330: 
1.119     paf       331:        exception_var_name=NEW String(pool, EXCEPTION_VAR_NAME);
                    332:        exception_type_part_name=NEW String(pool, EXCEPTION_TYPE_PART_NAME);
                    333:        exception_source_part_name=NEW String(pool, EXCEPTION_SOURCE_PART_NAME);
                    334:        exception_comment_part_name=NEW String(pool, EXCEPTION_COMMENT_PART_NAME);
                    335:        exception_handled_part_name=NEW String(pool, EXCEPTION_HANDLED_PART_NAME);
1.4       paf       336: 
1.79      parser    337:        charsets_name=NEW String(pool, CHARSETS_NAME);
1.36      paf       338:        mime_types_name=NEW String(pool, MIME_TYPES_NAME);
1.63      parser    339:        origins_mode_name=NEW String(pool, ORIGINS_MODE_NAME);
1.69      parser    340: 
                    341:        class_path_name=NEW String(pool, CLASS_PATH_NAME);
1.66      parser    342: 
                    343:        //^switch ^case
                    344:        switch_data_name=NEW String(pool, SWITCH_DATA_NAME);
1.120     paf       345: 
                    346:        //^cache
                    347:        cache_data_name=NEW String(pool, CACHE_DATA_NAME);
1.70      parser    348: 
                    349:        // sql
                    350:        sql_limit_name=NEW String(pool, SQL_LIMIT_NAME);
                    351:        sql_offset_name=NEW String(pool, SQL_OFFSET_NAME);
                    352:        sql_default_name=NEW String(pool, SQL_DEFAULT_NAME);
1.71      parser    353: 
1.95      paf       354:        // charsets
                    355:        charset_UTF8_name=NEW String(pool, CHARSET_UTF8_NAME);
                    356: 
1.71      parser    357:        // hash
                    358:        hash_default_element_name=NEW String(pool, HASH_DEFAULT_ELEMENT_NAME);
1.70      parser    359: 
1.1       paf       360:        // hashes
1.32      paf       361:        untaint_lang_name2enum=NEW Hash(pool);
// ULN(name, LANG) stores String::UL_<LANG> (as int) under `name`.
// The macro body already ends with ';', so every `ULN(...);` below leaves one extra empty statement.
1.87      paf       362:        #define ULN(cstr, LANG) \
                    363:                untaint_lang_name2enum->put(*NEW String(pool, cstr), (int)String::UL_##LANG);
                    364:        ULN("as-is", AS_IS);
                    365:        ULN("file-spec", FILE_SPEC);
                    366:        ULN("http-header", HTTP_HEADER);
                    367:        ULN("mail-header", MAIL_HEADER);
                    368:        ULN("uri", URI);
                    369:        ULN("table", TABLE);
                    370:        ULN("sql", SQL);
                    371:        ULN("js", JS);
                    372:        ULN("xml", XML);
                    373:        ULN("html", HTML);
// pastes to (int)String::UL_HTML|String::UL_OPTIMIZE_BIT: the cast applies to UL_HTML only, then the bit is OR-ed in
1.92      paf       374:        ULN("optimized-html", HTML|String::UL_OPTIMIZE_BIT);
1.123     paf       375: 
1.135     paf       376:        // string_match_table_template
                    377:        {
                    378:                Array *columns=NEW Array(pool);
                    379:                *columns+=NEW String(pool, STRING_PRE_MATCH_NAME);
                    380:                *columns+=NEW String(pool, STRING_MATCH_NAME);
                    381:                *columns+=NEW String(pool, STRING_POST_MATCH_NAME);
// numbered columns "1" .. MAX_STRING_MATCH_TABLE_COLUMNS; each name gets its own pool buffer of MAX_NUMBER bytes
1.123     paf       382:                for(int i=1; i<=MAX_STRING_MATCH_TABLE_COLUMNS; i++) {
1.125     paf       383:                        char *column=(char *)pool.malloc(MAX_NUMBER);
1.123     paf       384:                        snprintf(column, MAX_NUMBER, "%d", i);
1.135     paf       385:                        *columns+=NEW String(pool, column); // .i column name
                    386:                }
                    387:                string_match_table_template=NEW Table(pool, 0, columns);
                    388:        }
                    389: 
                    390:        // date_calendar_table_template
                    391:        {
                    392:                Array *columns=NEW Array(pool);
// seven numbered columns "0" .. "6", followed by the week number and week year columns
                    393:                for(int i=0; i<=6; i++) {
                    394:                        char *column=(char *)pool.malloc(MAX_NUMBER);
                    395:                        snprintf(column, MAX_NUMBER, "%d", i);
                    396:                        *columns+=NEW String(pool, column); // .i column name
1.123     paf       397:                }
1.135     paf       398:                *columns+=NEW String(pool, DATE_CALENDAR_WEEKNO_NAME);
1.137   ! paf       399:                *columns+=NEW String(pool, DATE_CALENDAR_WEEKYEAR_NAME);
1.135     paf       400:                date_calendar_table_template=NEW Table(pool, 0, columns);
1.123     paf       401:        }
1.1       paf       402: 
1.95      paf       403:        // charsets
                    404:        charsets=NEW Charsets(pool);
                    405:        charsets->put(*charset_UTF8_name, 
                    406:                utf8_charset=NEW Charset(pool, *charset_UTF8_name, 0/*no file=system*/));
1.88      paf       407: 
1.101     paf       408: 
1.88      paf       409:        // Status registration, must be initialized before all registrants
1.90      paf       410:        cache_managers=NEW Cache_managers(pool);
1.42      paf       411: 
1.73      parser    412:        // SQL driver manager
1.90      paf       413:        cache_managers->put(*NEW String(pool, "sql"), 
                    414:                SQL_driver_manager=NEW SQL_Driver_manager(pool));
1.74      parser    415: 
1.76      parser    416: #ifdef XML
1.96      paf       417:        // initializing xml libs
                    418: 
                    419:        /* First I get a DOMImplementation reference */
                    420:        domimpl = gdome_di_mkref ();
                    421:     /*
                    422:      * Register the EXSLT extensions and the test module
                    423:      */
                    424:     exsltRegisterAll();
                    425:     xsltRegisterTestModule();
                    426:     xmlDefaultSAXHandlerInit();
                    427:     /*
                    428:      * disable CDATA from being built in the document tree
                    429:      */
1.101     paf       430:     // never added yet  xmlDefaultSAXHandler.cdataBlock = NULL;
1.99      paf       431: 
                    432:        /*
                    433:         * Initialization function for the XML parser.
                    434:         * This is not reentrant. Call once before processing in case of
                    435:         * use in multithreaded programs.
                    436:        */
                    437:        xmlInitParser();
1.107     paf       438: 
                    439:        // 1. this is needed for proper parsing of stylesheets
                    440:        // there was a situation where an honest entity ruined an innocent xpath compilation
                    441:        // doc says "you should turn it on on stylesheet load" without going into details
                    442:        // 2. when a dom tree with entities goes under transform, text nodes 
                    443:        // got [erroneously] cut on the first entity occurrence
1.109     paf       444:        // --
1.107     paf       445:        // that is why this is:
                    446:        xmlSubstituteEntitiesDefault(1);
1.100     paf       447:        
                    448:        // Bit in the loadsubset context field to tell to do ID/REFs lookups 
                    449:        xmlLoadExtDtdDefaultValue |= XML_DETECT_IDS;
                    450:        // Bit in the loadsubset context field to tell to do complete the elements attributes lists 
                    451:        // with the ones defaulted from the DTDs 
                    452:     //never added yet xmlLoadExtDtdDefaultValue |= XML_COMPLETE_ATTRS;
1.99      paf       453: 
1.104     paf       454: //regretfully this not only replaces entities on parse, but also on generate   xmlSubstituteEntitiesDefault(1);
1.105     paf       455:        // never switched this on xmlIndentTreeOutput=1;
1.104     paf       456: 
// all error slots start free; the same callback collects both libxml and libxslt errors
1.101     paf       457:        memset(xml_generic_error_infos, 0, sizeof(xml_generic_error_infos));
                    458:        xmlSetGenericErrorFunc(0, xmlParserGenericErrorFunc);
1.102     paf       459:        xsltSetGenericErrorFunc(0, xmlParserGenericErrorFunc);
1.105     paf       460: //     FILE *f=fopen("y:\\xslt.log", "wt");
                    461: //     xsltSetGenericDebugFunc(f/*stderr*/, 0);
1.110     paf       462: 
                    463:        // http://localhost/abc -> $ENV{DOCUMENT_ROOT}/abc | ./abc
// only input callbacks are registered (xmlFileWrite is not among them); the return value is not checked
                    464:        xmlRegisterInputCallbacks(
                    465:                xmlFileMatchLocalhost, xmlFileOpenLocalhost,
                    466:                xmlFileRead, xmlFileClose);
1.96      paf       467: 
                    468:        // XSLT stylesheet manager
1.90      paf       469:        cache_managers->put(*NEW String(pool, "stylesheet"), 
                    470:                stylesheet_manager=NEW Stylesheet_manager(pool));
1.76      parser    471: #endif
1.1       paf       472: }
1.76      parser    473: 
                    474: #if defined(XML) && defined(_MSC_VER)
1.132     paf       475: #      define GNOME_LIBS "/parser3project/win32xml/win32/gnome"
1.131     paf       476: #      pragma comment(lib, GNOME_LIBS "/glib/lib/libglib-1.3-11.lib")
1.76      parser    477: #      ifdef _DEBUG
1.131     paf       478: #              pragma comment(lib, GNOME_LIBS "/libxml2-x.x.x/win32/dsp/libxml2_so_debug/libxml2.lib")
                    479: #              pragma comment(lib, GNOME_LIBS "/libxslt-x.x.x/win32/dsp/libexslt_so_debug/libexslt.lib")
                    480: #              pragma comment(lib, GNOME_LIBS "/libxslt-x.x.x/win32/dsp/libxslt_so_debug/libxslt.lib")
                    481: #              pragma comment(lib, GNOME_LIBS "/gdome2-x.x.x/win32/dsp/Debug/libgdome.lib")
1.76      parser    482: #      else
1.131     paf       483: #              pragma comment(lib, GNOME_LIBS "/libxml2-x.x.x/win32/dsp/libxml2_so_release/libxml2.lib")
                    484: #              pragma comment(lib, GNOME_LIBS "/libxslt-x.x.x/win32/dsp/libexslt_so_release/libexslt.lib")
                    485: #              pragma comment(lib, GNOME_LIBS "/libxslt-x.x.x/win32/dsp/libxslt_so_release/libxslt.lib")
                    486: #              pragma comment(lib, GNOME_LIBS "/gdome2-x.x.x/win32/dsp/Release/libgdome.lib")
1.85      paf       487: #      endif
                    488: #endif

E-mail: