--- parser3/src/main/pa_charsets.C 2003/09/25 09:15:03 1.13 +++ parser3/src/main/pa_charsets.C 2023/09/26 20:49:09 1.26 @@ -1,42 +1,59 @@ /** @file Parser: sql driver manager implementation. - Copyright (c) 2001-2003 ArtLebedev Group (http://www.artlebedev.com) - Author: Alexandr Petrosian (http://paf.design.ru) + Copyright (c) 2001-2023 Art. Lebedev Studio (http://www.artlebedev.com) + Authors: Konstantin Morshnev , Alexandr Petrosian */ -static const char* IDENT_CHARSETS_C="$Date: 2003/09/25 09:15:03 $"; - #include "pa_charsets.h" +volatile const char * IDENT_PA_CHARSETS_C="$Id: pa_charsets.C,v 1.26 2023/09/26 20:49:09 moko Exp $" IDENT_PA_CHARSETS_H; + // defines for globals #define CHARSET_UTF8_NAME "UTF-8" // globals -Charset UTF8_charset(0, *new String(CHARSET_UTF8_NAME), 0/*no file=system*/); +Charset pa_UTF8_charset(0, *new String(CHARSET_UTF8_NAME), 0/*no file=system*/); -Charsets charsets; +Charsets pa_charsets; // methods Charsets::Charsets() { - put(UTF8_charset.NAME(), &UTF8_charset); + put(pa_UTF8_charset.NAME(), &pa_UTF8_charset); +} + +Charset& Charsets::get(String::Body ANAME) { + ANAME=str_upper(ANAME.cstr(), ANAME.length()); + if(Charset* result=HashString::get(ANAME)) + return *result; + else + throw Exception(PARSER_RUNTIME, new String(ANAME, String::L_TAINTED), "unknown charset"); } -Charset& Charsets::get(const String::Body ANAME) { - if(Charset* result=Hash::get(ANAME)) +Charset& Charsets::get_direct(const char *ANAME) { + if(Charset* result=HashString::get(ANAME)) return *result; else - throw Exception("parser.runtime", - new String(ANAME, String::L_TAINTED), - "unknown charset"); + throw Exception(PARSER_RUNTIME, new String(ANAME, String::L_TAINTED), "unknown charset"); +} + +Charset* Charsets::checkBOM(char *&body,size_t &body_size, Charset* enforced_charset){ + if((!enforced_charset || enforced_charset->isUTF8()) && (body_size>=3 && strncmp(body, "\xEF\xBB\xBF", 3)==0)){ + // skip UTF-8 signature (BOM code) + body+=3; + body_size-=3; + return &pa_UTF8_charset; + } + return enforced_charset; } -void Charsets::load_charset(Request_charsets& charsets, const String::Body ANAME, const String& afile_spec) { +void Charsets::load_charset(Request_charsets& charsets, String::Body ANAME, const String& afile_spec) { + ANAME=str_upper(ANAME.cstr(), ANAME.length()); //we know that charset? - if(Hash::get(ANAME)) + if(HashString::get(ANAME)) return; // don't load it then put(ANAME, new Charset(&charsets, ANAME, &afile_spec));