|
|
| version 1.239, 2019/09/06 10:17:07 | version 1.255, 2024/09/28 14:37:53 |
|---|---|
| Line 1 | Line 1 |
| /** @file | /** @file |
| Parser: @b string parser class. | Parser: @b string parser class. |
| Copyright (c) 2001-2017 Art. Lebedev Studio (http://www.artlebedev.com) | Copyright (c) 2001-2023 Art. Lebedev Studio (http://www.artlebedev.com) |
| Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru) | Authors: Konstantin Morshnev <moko@design.ru>, Alexandr Petrosian <paf@design.ru> |
| */ | */ |
| #include "classes.h" | #include "classes.h" |
| #include "pa_vmethod_frame.h" | #include "pa_vmethod_frame.h" |
| #include "pa_base64.h" | |
| #include "pa_request.h" | #include "pa_request.h" |
| #include "pa_vdouble.h" | #include "pa_vdouble.h" |
| Line 152 static void _bool(Request& r, MethodPara | Line 153 static void _bool(Request& r, MethodPara |
| } | } |
| static void _left(Request& r, MethodParams& params) { | static void _left(Request& r, MethodParams& params) { |
| ssize_t sn=params.as_int(0, "n must be int", r); | int sn=params.as_int(0, "n must be int", r); |
| const String& string=GET_SELF(r, VString).string(); | const String& string=GET_SELF(r, VString).string(); |
| r.write(sn<0 ? string : string.mid(r.charsets.source(), 0, (size_t)sn)); | r.write(sn<0 ? string : string.mid(r.charsets.source(), 0, sn)); |
| } | } |
| static void _right(Request& r, MethodParams& params) { | static void _right(Request& r, MethodParams& params) { |
| ssize_t sn=params.as_int(0, "n must be int", r); | int sn=params.as_int(0, "n must be int", r); |
| if(sn>0){ | if(sn>0){ |
| size_t n=(size_t)sn; | size_t n=sn; |
| const String& string=GET_SELF(r, VString).string(); | const String& string=GET_SELF(r, VString).string(); |
| size_t length=string.length(r.charsets.source()); | size_t length=string.length(r.charsets.source()); |
| r.write(n<length ? string.mid(r.charsets.source(), length-n, length, length) : string); | r.write(n<length ? string.mid(r.charsets.source(), length-n, length, length) : string); |
| Line 170 static void _right(Request& r, MethodPar | Line 171 static void _right(Request& r, MethodPar |
| static void _mid(Request& r, MethodParams& params) { | static void _mid(Request& r, MethodParams& params) { |
| const String& string=GET_SELF(r, VString).string(); | const String& string=GET_SELF(r, VString).string(); |
| ssize_t sbegin=params.as_int(0, "p must be int", r); | int begin=params.as_int(0, "p must be int", r); |
| if(sbegin<0) | if(begin<0) |
| throw Exception(PARSER_RUNTIME, 0, "p(%d) must be >=0", sbegin); | throw Exception(PARSER_RUNTIME, 0, "p(%d) must be >=0", begin); |
| size_t begin=(size_t)sbegin; | |
| size_t end; | size_t end; |
| size_t length=0; | size_t length=0; |
| if(params.count()>1) { | if(params.count()>1) { |
| ssize_t sn=params.as_int(1, "n must be int", r); | int n=params.as_int(1, "n must be int", r); |
| if(sn<0) | if(n<0) |
| throw Exception(PARSER_RUNTIME, 0, "n(%d) must be >=0", sn); | throw Exception(PARSER_RUNTIME, 0, "n(%d) must be >=0", n); |
| end=begin+(size_t)sn; | end=begin+n; |
| } else { | } else { |
| length=string.length(r.charsets.source()); | length=string.length(r.charsets.source()); |
| end=length; | end=length; |
| Line 194 static void _pos(Request& r, MethodParam | Line 195 static void _pos(Request& r, MethodParam |
| Value& substr=params.as_no_junction(0, "substr must not be code"); | Value& substr=params.as_no_junction(0, "substr must not be code"); |
| const String& string=GET_SELF(r, VString).string(); | const String& string=GET_SELF(r, VString).string(); |
| ssize_t offset=0; | int offset=0; |
| if(params.count()>1){ | if(params.count()>1){ |
| offset=params.as_int(1, "n must be int", r); | offset=params.as_int(1, "n must be int", r); |
| if(offset<0) | if(offset<0) |
| throw Exception(PARSER_RUNTIME, 0, "n(%d) must be >=0", offset); | throw Exception(PARSER_RUNTIME, 0, "n(%d) must be >=0", offset); |
| } | } |
| r.write(*new VInt((int)string.pos(r.charsets.source(), substr.as_string(), (size_t)offset))); | r.write(*new VInt((int)string.pos(r.charsets.source(), substr.as_string(), offset))); |
| } | |
| struct Split_action_info { | |
| const String& src; | |
| ArrayString &result; | |
| }; | |
| static void split_action(Table& , ArrayString* row, int prestart, int prefinish, int poststart, int postfinish, void *info) { | |
| Split_action_info& ai=*static_cast<Split_action_info *>(info); | |
| if(row) { // begin&middle | |
| // piece from last match['prestart'] to beginning of this match['prefinish'] | |
| ai.result += &ai.src.mid(prestart, prefinish); | |
| } else // end | |
| if(poststart != postfinish) | |
| ai.result += &ai.src.mid(poststart, postfinish); | |
| } | } |
| static void split_list(MethodParams& params, int paramIndex, const String& string, ArrayString& result) { | static void split_list(Value& delim_value, const String& string, ArrayString& result) { |
| Value& delim_value=params.as_no_junction(paramIndex, "delimiter must not be code"); | if(VRegex *vregex=dynamic_cast<VRegex*>(&delim_value)){ |
| string.split(result, 0, delim_value.as_string()); | vregex->study(); |
| int matches_count=0; | |
| Split_action_info ai = { string, result }; | |
| string.match(vregex, split_action, &ai, matches_count); | |
| } else | |
| string.split(result, 0, delim_value.as_string()); | |
| } | } |
| #define SPLIT_LEFT 0x0001 | #define SPLIT_LEFT 0x0001 |
| Line 254 static Table& split_vertical(ArrayString | Line 277 static Table& split_vertical(ArrayString |
| table+=row; | table+=row; |
| } | } |
| } else { // left | } else { // left |
| Array_iterator<const String*> i(pieces); | for(ArrayString::Iterator i(pieces); i; ) { |
| while(i.has_next()) { | |
| Table::element_type row(new ArrayString); | Table::element_type row(new ArrayString); |
| *row+=i.next(); | *row+=i.next(); |
| table+=row; | table+=row; |
| Line 272 static Table& split_horizontal(ArrayStri | Line 294 static Table& split_horizontal(ArrayStri |
| for(int i=pieces.count(); --i>=0; ) | for(int i=pieces.count(); --i>=0; ) |
| *row+=pieces[i]; | *row+=pieces[i]; |
| } else { // left | } else { // left |
| for(Array_iterator<const String*> i(pieces); i.has_next(); ) | for(ArrayString::Iterator i(pieces); i; ) |
| *row+=i.next(); | *row+=i.next(); |
| } | } |
| table+=row; | table+=row; |
| Line 285 static void split_with_options(Request& | Line 307 static void split_with_options(Request& |
| size_t params_count=params.count(); | size_t params_count=params.count(); |
| ArrayString pieces; | ArrayString pieces; |
| split_list(params, 0, string, pieces); | split_list(params.as_no_junction(0, "delimiter must not be code"), string, pieces); |
| if(!bits) { | if(!bits) { |
| const String* options=0; | const String* options=0; |
| Line 363 static void _match(Request& r, MethodPar | Line 385 static void _match(Request& r, MethodPar |
| Value& regexp=params.as_no_junction(0, "regexp must not be code"); | Value& regexp=params.as_no_junction(0, "regexp must not be code"); |
| Value* options=(params_count>1)?&params.as_no_junction(1, OPTIONS_MUST_NOT_BE_CODE):0; | Value* options=(params_count>1)?&params.as_no_junction(1, OPTIONS_MUST_NOT_BE_CODE):0; |
| VRegex* vregex; | VRegex* vregex=dynamic_cast<VRegex*>(&regexp); |
| VRegexCleaner vrcleaner; | VRegexCleaner vrcleaner; |
| if(Value* value=regexp.as(VREGEX_TYPE)){ | if(vregex){ |
| if(options && options->is_defined()) | if(options && options->is_defined()) |
| throw Exception(PARSER_RUNTIME, 0, "you can not specify regex-object and options together"); | throw Exception(PARSER_RUNTIME, 0, "you cannot specify regex-object and options together"); |
| vregex=static_cast<VRegex*>(value); | |
| } else { | } else { |
| vregex=new VRegex(r.charsets.source(), &regexp.as_string(), (options) ? (&options->as_string()) : 0); | vregex=new VRegex(r.charsets.source(), &regexp.as_string(), (options) ? (&options->as_string()) : 0); |
| vregex->study(); | vregex->study(); |
| Line 443 static void _lower(Request& r, MethodPar | Line 464 static void _lower(Request& r, MethodPar |
| #ifndef DOXYGEN | #ifndef DOXYGEN |
| class String_sql_event_handlers: public SQL_Driver_query_event_handlers { | class String_sql_event_handlers: public SQL_Driver_query_event_handlers { |
| const String& statement_string; const char* statement_cstr; | |
| bool got_column; | bool got_column; |
| public: | public: |
| bool got_cell; | bool got_cell; |
| const String* result; | const String* result; |
| public: | public: |
| String_sql_event_handlers( | String_sql_event_handlers(): |
| const String& astatement_string, const char* astatement_cstr): | |
| statement_string(astatement_string), statement_cstr(astatement_cstr), | |
| got_column(false), | got_column(false), |
| got_cell(false), | got_cell(false), |
| result(&String::Empty) {} | result(&String::Empty) {} |
| bool add_column(SQL_Error& error, const char* /*str*/, size_t /*length*/) { | bool add_column(SQL_Error& error, const char* /*str*/, size_t /*length*/) { |
| if(got_column) { | if(got_column) { |
| error=SQL_Error(PARSER_RUNTIME, /*statement_string,*/ "result must contain exactly one column"); | error=SQL_Error("result must contain exactly one column"); |
| return true; | return true; |
| } | } |
| got_column=true; | got_column=true; |
| Line 468 public: | Line 486 public: |
| bool add_row(SQL_Error& /*error*/) { /* ignore */ return false; } | bool add_row(SQL_Error& /*error*/) { /* ignore */ return false; } |
| bool add_row_cell(SQL_Error& error, const char* str, size_t) { | bool add_row_cell(SQL_Error& error, const char* str, size_t) { |
| if(got_cell) { | if(got_cell) { |
| error=SQL_Error(PARSER_RUNTIME, /*statement_string,*/ "result must not contain more then one row"); | error=SQL_Error("result must contain no more than one row"); |
| return true; | return true; |
| } | } |
| try { | try { |
| got_cell=true; | got_cell=true; |
| result=new String(str, String::L_TAINTED /* no length as 0x00 can be inside */ ); | result=new String(str, String::L_TAINTED /* no length as 0x00 can be inside */ ); |
| Line 524 const String* sql_result_string(Request& | Line 541 const String* sql_result_string(Request& |
| const String& statement_string=r.process_to_string(statement); | const String& statement_string=r.process_to_string(statement); |
| const char* statement_cstr=statement_string.untaint_cstr(String::L_SQL, r.connection()); | const char* statement_cstr=statement_string.untaint_cstr(String::L_SQL, r.connection()); |
| String_sql_event_handlers handlers(statement_string, statement_cstr); | String_sql_event_handlers handlers; |
| r.connection()->query( | r.connection()->query(statement_cstr, placeholders_count, placeholders, offset, limit, handlers, statement_string); |
| statement_cstr, | |
| placeholders_count, placeholders, | |
| offset, limit, | |
| handlers, | |
| statement_string); | |
| if(bind) | if(bind) |
| unmarshal_bind_updates(*bind, placeholders_count, placeholders); | unmarshal_bind_updates(*bind, placeholders_count, placeholders); |
| Line 561 static void _replace(Request& r, MethodP | Line 573 static void _replace(Request& r, MethodP |
| if(params.count()==1) { | if(params.count()==1) { |
| // ^string.replace[table] | // ^string.replace[table] |
| Table* table=params.as_table(0, "param"); | if(Table* table=params.as_table(0, "param")){ |
| Dictionary dict(*table); | Dictionary dict(*table); |
| r.write(src.replace(dict)); | r.write(src.replace(dict)); |
| } else | |
| r.write(src); | |
| } else { | } else { |
| // ^string.replace[from-string;to-string] | // ^string.replace[from-string;to-string] |
| Dictionary dict(params.as_string(0, "from must be string"), params.as_string(1, "to must be string")); | Dictionary dict(params.as_string(0, "from must be string"), params.as_string(1, "to must be string")); |
| Line 610 static void _save(Request& r, MethodPara | Line 624 static void _save(Request& r, MethodPara |
| String::Body sbody=src.cstr_to_string_body_untaint(String::L_AS_IS, r.connection(false), &r.charsets); | String::Body sbody=src.cstr_to_string_body_untaint(String::L_AS_IS, r.connection(false), &r.charsets); |
| // write | // write |
| file_write(r.charsets, r.absolute(file_name), sbody.cstr(), sbody.length(), true, do_append, asked_charset); | file_write(r.charsets, r.full_disk_path(file_name), sbody.cstr(), sbody.length(), true, do_append, asked_charset); |
| } | } |
| static void _normalize(Request& r, MethodParams&) { | static void _normalize(Request& r, MethodParams&) { |
| Line 650 static void _trim(Request& r, MethodPara | Line 664 static void _trim(Request& r, MethodPara |
| r.write(src.trim(kind, chars, &r.charsets.source())); | r.write(src.trim(kind, chars, &r.charsets.source())); |
| } | } |
| Base64Options base64_encode_options(Request& r, HashStringValue* options) { | |
| Base64Options result; | |
| if(options) { | |
| int valid_options=0; | |
| for(HashStringValue::Iterator i(*options); i; i.next()) { | |
| String::Body key=i.key(); | |
| Value* value=i.value(); | |
| if(key == "pad") { | |
| result.pad=r.process(*value).as_bool(); | |
| valid_options++; | |
| } else if(key == "wrap") { | |
| result.wrap=r.process(*value).as_bool(); | |
| valid_options++; | |
| } else if(key == "url-safe") { | |
| if(r.process(*value).as_bool()) | |
| result.set_url_safe_abc(); | |
| valid_options++; | |
| } | |
| } | |
| if(valid_options != options->count()) | |
| throw Exception(PARSER_RUNTIME, 0, CALLED_WITH_INVALID_OPTION); | |
| } | |
| return result; | |
| } | |
| Base64Options base64_decode_options(Request& r, HashStringValue* options) { | |
| Base64Options result; | |
| if(options) { | |
| int valid_options=0; | |
| for(HashStringValue::Iterator i(*options); i; i.next() ) { | |
| String::Body key=i.key(); | |
| Value* value=i.value(); | |
| if(key == "pad") { | |
| result.pad=r.process(*value).as_bool(); | |
| valid_options++; | |
| } else if(key == "strict") { | |
| result.strict=r.process(*value).as_bool(); | |
| valid_options++; | |
| } else if(key == "url-safe") { | |
| if(r.process(*value).as_bool()) | |
| result.set_url_safe_abc(); | |
| valid_options++; | |
| } | |
| } | |
| if(valid_options != options->count()) | |
| throw Exception(PARSER_RUNTIME, 0, CALLED_WITH_INVALID_OPTION); | |
| } | |
| return result; | |
| } | |
| static void _base64(Request& r, MethodParams& params) { | static void _base64(Request& r, MethodParams& params) { |
| if(&r.get_self() == string_class) { | if(&r.get_self() == string_class) { |
| // decode: ^string:base64[encoded[;$.strict(true|false)]] | // decode: ^string:base64[encoded[;options]] |
| const char* cstr=params.count() ? params.as_string(0, PARAMETER_MUST_BE_STRING).cstr() : ""; | const char* cstr=params.count() ? params.as_string(0, PARAMETER_MUST_BE_STRING).cstr() : ""; |
| char* decoded=0; | Base64Options options = base64_decode_options(r, params.count() > 1 ? params.as_hash(1) : NULL); |
| size_t length=0; | |
| bool strict=false; | char* decoded=0; |
| if(params.count() > 1) | size_t length=pa_base64_decode(cstr, strlen(cstr), decoded, options); |
| if(HashStringValue* options=params.as_hash(1)) { | |
| int valid_options=0; | |
| if(Value* vstrict=options->get(BASE64_STRICT_OPTION_NAME)) { | |
| strict=r.process(*vstrict).as_bool(); | |
| valid_options++; | |
| } | |
| if(valid_options!=options->count()) | |
| throw Exception(PARSER_RUNTIME, 0, CALLED_WITH_INVALID_OPTION); | |
| } | |
| pa_base64_decode(cstr, strlen(cstr), decoded, length, strict); | |
| if(decoded && length){ | if(decoded && length){ |
| if(memchr((const char*)decoded, 0, length)) | if(memchr(decoded, 0, length)) |
| throw Exception(PARSER_RUNTIME, 0, "Invalid \\x00 character found while decode to string. Decode it to file instead."); | throw Exception(PARSER_RUNTIME, 0, "Invalid \\x00 character found while decoding to string. Decode to file instead."); |
| fix_line_breaks(decoded, length); | fix_line_breaks(decoded, length); |
| if(length) | if(length) |
| r.write(*new String(decoded, String::L_TAINTED)); | r.write(*new String(decoded, String::L_TAINTED)); |
| } | } |
| } else { | } else { |
| // encode: ^str.base64[] | // encode: ^str.base64[options] |
| VString& self=GET_SELF(r, VString); | VString& self=GET_SELF(r, VString); |
| const char* cstr=self.string().cstr(); | const char* cstr=self.string().cstr(); |
| const char* encoded=pa_base64_encode(cstr, strlen(cstr)); | Base64Options options = base64_encode_options(r, params.count() ? params.as_hash(0) : NULL); |
| r.write(*new String(encoded, String::L_TAINTED/*once ?param=base64(something) was needed*/)); | const char* encoded=pa_base64_encode(cstr, strlen(cstr), options); |
| r.write(*new String(encoded, String::L_TAINTED /*once ?param=base64(something) was needed*/ )); | |
| } | } |
| } | } |