Annotation of parser3/src/main/pa_charsets.C, revision 1.28

1.1       paf         1: /** @file
                      2:        Parser: sql driver manager implementation.
                      3: 
1.27      moko        4:        Copyright (c) 2001-2024 Art. Lebedev Studio (http://www.artlebedev.com)
1.26      moko        5:        Authors: Konstantin Morshnev <moko@design.ru>, Alexandr Petrosian <paf@design.ru>
1.9       paf         6: */
1.1       paf         7: 
1.19      moko        8: #include "pa_charsets.h"
1.1       paf         9: 
1.28    ! moko       10: volatile const char * IDENT_PA_CHARSETS_C="$Id: pa_charsets.C,v 1.27 2024/11/04 03:53:25 moko Exp $" IDENT_PA_CHARSETS_H;
1.12      paf        11: 
                     12: // defines for globals
                     13: 
                     14: #define CHARSET_UTF8_NAME "UTF-8"
1.1       paf        15: 
                     16: // globals
                     17: 
1.28    ! moko       18: static String charset_utf8_name(CHARSET_UTF8_NAME);
        !            19: Charset pa_UTF8_charset(0, charset_utf8_name, 0/*no file=system*/);
1.1       paf        20: 
1.23      moko       21: Charsets pa_charsets;
1.1       paf        22: 
1.12      paf        23: // methods
1.1       paf        24: 
1.12      paf        25: Charsets::Charsets() {
1.23      moko       26:        put(pa_UTF8_charset.NAME(), &pa_UTF8_charset);
1.1       paf        27: }
                     28: 
1.22      moko       29: Charset& Charsets::get(String::Body ANAME) {
                     30:        ANAME=str_upper(ANAME.cstr(), ANAME.length());
1.18      misha      31:        if(Charset* result=HashString<value_type>::get(ANAME))
1.2       paf        32:                return *result;
                     33:        else
1.22      moko       34:                throw Exception(PARSER_RUNTIME, new String(ANAME, String::L_TAINTED), "unknown charset");
                     35: }
                     36: 
                     37: Charset& Charsets::get_direct(const char *ANAME) {
                     38:        if(Charset* result=HashString<value_type>::get(ANAME))
                     39:                return *result;
                     40:        else
                     41:                throw Exception(PARSER_RUNTIME, new String(ANAME, String::L_TAINTED), "unknown charset");
1.2       paf        42: }
1.3       paf        43: 
1.20      moko       44: Charset* Charsets::checkBOM(char *&body,size_t &body_size, Charset* enforced_charset){
                     45:        if((!enforced_charset || enforced_charset->isUTF8()) && (body_size>=3 && strncmp(body, "\xEF\xBB\xBF", 3)==0)){
                     46:                // skip UTF-8 signature (BOM code)
                     47:                body+=3;
                     48:                body_size-=3;
1.23      moko       49:                return &pa_UTF8_charset;
1.20      moko       50:        }
                     51:        return enforced_charset;
                     52: }
                     53: 
1.22      moko       54: void Charsets::load_charset(Request_charsets& charsets, String::Body ANAME, const String& afile_spec) {
                     55:        ANAME=str_upper(ANAME.cstr(), ANAME.length());
1.3       paf        56:        //we know that charset?
1.18      misha      57:        if(HashString<value_type>::get(ANAME))
1.3       paf        58:                return; // don't load it then
                     59: 
1.12      paf        60:        put(ANAME, new Charset(&charsets, ANAME, &afile_spec));
1.4       paf        61: }

E-mail: