Annotation of parser3/src/main/pa_string.C, revision 1.172.2.21.2.5
1.45 paf 1: /** @file
1.55 paf 2: Parser: string class. @see untaint.C.
1.46 paf 3:
1.172.2.11 paf 4: Copyright (c) 2001-2003 ArtLebedev Group (http://www.artlebedev.com)
1.138 paf 5: Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru)
1.164 paf 6: */
1.46 paf 7:
/// Revision-date stamp of this source file (a "$Date$" keyword string kept in the binary).
static const char* IDENT_STRING_C=
	"$Date: 2003/03/19 13:16:56 $";
1.4 paf 9:
1.70 paf 10: #include "pcre.h"
11:
1.12 paf 12: #include "pa_string.h"
1.22 paf 13: #include "pa_exception.h"
1.61 paf 14: #include "pa_table.h"
1.101 parser 15: #include "pa_dictionary.h"
1.132 paf 16: #include "pa_charset.h"
1.60 paf 17:
1.172.2.2 paf 18: // helpers
1.139 paf 19:
1.172.2.2 paf 20: /// String::match uses this as replace & global search table columns
1.139 paf 21:
1.172.2.4 paf 22: const int MAX_MATCH_GROUPS=100;
23:
1.172.2.14 paf 24: class String_match_table_template_columns: public ArrayString {
1.172.2.2 paf 25: public:
1.172.2.4 paf 26: String_match_table_template_columns() {
1.172.2.21.2. (paf 27:): *this+=new String("prematch");
28:): *this+=new String("match");
29:): *this+=new String("postmatch");
1.172.2.4 paf 30: for(int i=0; i<MAX_MATCH_GROUPS; i++) {
1.172.2.21.2. (paf 31:): char *cname=new(PointerFreeGC) char[3/*strlen("100")*/+1/*terminating 0*/];
32:): *this+=new String(cname, sprintf(cname, "%d", 1+i));
1.172.2.2 paf 33: }
1.172.2.21 paf 34: }
1.172.2.4 paf 35: };
36:
1.172.2.21.2. (paf 37:): Table string_match_table_template(new String_match_table_template_columns);
1.172.2.2 paf 38:
1.172.2.21.2. (paf 39:): // String::ArrayFragment methods
40:):
41:): String::ArrayFragment& String::ArrayFragment::append(const ArrayFragment& src,
42:): size_t substr_start, size_t substr_end) {
43:): if(substr_start==substr_end)
44:): return *this;
45:):
46:): size_t fragment_start=0;
47:): size_t fragment_end;
48:): for(Array_iterator<element_type> i(src); ; fragment_start=fragment_end) {
49:): const element_type& fragment=i.next();
50:): fragment_end=fragment_start+fragment.size;
51:):
52:): if(substr_start<fragment_start) // not reached fragments which may include 'substr'?
53:): continue;
54:):
55:): // found first fragment including piece of 'substr'
56:): size_t piece_end=min(substr_end, fragment_end);
57:): *this+=Fragment(fragment.lang, piece_end-substr_start);
58:):
59:): while(substr_end>fragment_end) { // are there more fragments including pieces of 'substr'?
60:): const element_type& fragment=i.next();
61:): fragment_end=fragment_start+fragment.size;
62:):
63:): if(substr_end>fragment_end) // are there still more?
64:): simple_append(Fragment(fragment.lang, fragment.size)); // appending whole fragment
65:): else { // no, it was last
66:): simple_append(Fragment(fragment.lang, substr_end-fragment_start));
67:): goto break2;
68:): }
69:): }
70:):
71:): break;
72:): }
73:): break2:
74:):
75:): return *this;
76:): }
77:): /*
78:): void String::ArrayFragment::mid(ArrayFragment& result, size_t substr_start, size_t substr_end) {
79:): }
80:): */
81:):
82:): // String methods
1.172.2.2 paf 83:
1.172.2.21.2. (paf 84:): String::String(const char* src, size_t src_size, bool tainted): body(CORD_EMPTY) {
1.41 paf 85: if(src)
1.75 paf 86: if(tainted)
87: APPEND_TAINTED(src, src_size, 0, 0);
1.41 paf 88: else
1.75 paf 89: APPEND_CLEAN(src, src_size, 0, 0);
1.1 paf 90: }
1.140 paf 91:
1.172.2.21.2. (paf 92:): String::String(const String& src): body(src.body), fragments(src.fragments) {}
1.28 paf 93:
1.13 paf 94: String& String::real_append(STRING_APPEND_PARAMS) {
1.9 paf 95: if(!src)
96: return *this;
1.26 paf 97: if(!size)
98: size=strlen(src);
99: if(!size)
1.9 paf 100: return *this;
1.122 paf 101:
1.172.2.21.2. (paf 102:): body=CORD_cat_char_star(body, src, size);
103:): fragments+=Fragment(lang, size);
1.1 paf 104:
105: return *this;
106: }
107:
1.172.2.21.2. (paf 108:): static int CORD_batched_iter_fn_generic_hash_code(const char * s, void * client_data) {
109:): uint& result=*static_cast<uint*>(client_data);
110:): generic_hash_code(result, s);
111:): return 0;
112:): };
1.16 paf 113: uint String::hash_code() const {
1.7 paf 114: uint result=0;
1.172.2.21.2. (paf 115:): CORD_iter5(body, 0, 0, CORD_batched_iter_fn_generic_hash_code, &result);
1.5 paf 116: return result;
117: }
118:
1.172.2.21.2. (paf 119:): const String& String::mid(size_t substr_start, size_t substr_end) const {
120:): String& result=*new String;
1.33 paf 121:
1.172.2.21.2. (paf 122:): substr_start=min(substr_start, size());
123:): substr_end=max(substr_start, substr_end);
124:): if(substr_start==substr_end)
125:): return result;
1.52 paf 126:
1.172.2.21.2. (paf 127:): // first: letters themselves
128:): result.body=CORD_substr(body, substr_start, substr_end-substr_start);
1.46 paf 129:
1.172.2.21.2. (paf 130:): // next: their langs
131:): result.fragments.append(fragments, substr_start, substr_end);
1.53 paf 132:
1.60 paf 133: // SAPI::log(pool(), "piece of '%s' from %d to %d is '%s'",
1.172.2.21.2. (paf 134:): //cstr(), substr_start, substr_end, result.cstr());
1.53 paf 135: return result;
1.54 paf 136: }
137:
1.172.2.21.2. (paf 138:): size_t String::pos(CORD substr,
139:): size_t this_offset, Untaint_lang lang) const {
140:): // first: letters themselves
141:): size_t substr_start=CORD_str(body, this_offset, substr);
142:): if(substr_start==CORD_NOT_FOUND)
143:): return STRING_NOT_FOUND;
144:):
145:): // next: check the lang when specified
146:):
147:): if(lang==UL_UNSPECIFIED) // ignore lang?
148:): return substr_start;
149:):
150:): // substr must be in one fragment, and fragments' lang must = lang
151:): size_t substr_end=substr_start+CORD_len(substr);
152:): size_t fragment_start=0;
153:): size_t fragment_end;
154:): for(Array_iterator<ArrayFragment::element_type> i(fragments); i.has_next(); fragment_start=fragment_end) {
155:): const Fragment& fragment=i.next();
156:): fragment_end=fragment_start+fragment.size;
157:):
158:): if(substr_start<fragment_start) // not reached fragments which may include 'result'?
159:): continue;
160:):
161:): if(substr_end>fragment_end) // end of substr OUT of current fragment?
162:): break;
163:):
164:): return fragment.lang==lang?substr_end:STRING_NOT_FOUND;
165:): }
166:):
167:): return STRING_NOT_FOUND;
1.58 paf 168: }
169:
1.172.2.21.2. (paf 170:): size_t String::pos(const String& substr,
171:): size_t this_offset, Untaint_lang lang) const {
172:): return pos(substr.body, this_offset, lang);
1.60 paf 173: }
174:
1.172.2.14 paf 175: void String::split(ArrayString& result,
1.172.2.21.2. (paf 176:): size_t& pos_after,
177:): const char* delim,
1.172.2.10 paf 178: Untaint_lang lang, int limit) {
1.125 paf 179: size_t self_size=size();
1.172.2.21.2. (paf 180:): if(size_t delim_size=strlen(delim)) {
1.60 paf 181: int pos_before;
182: // while we have 'delim'...
1.172.2.21.2. (paf 183:): for(; (pos_before=pos(delim, pos_after, lang))>=0 && limit; limit--) {
184:): result+=&mid(pos_after, pos_before);
1.60 paf 185: pos_after=pos_before+delim_size;
186: }
187: // last piece
1.124 paf 188: if(pos_after<self_size && limit) {
1.172.2.21.2. (paf 189:): result+=&mid(pos_after, self_size);
1.124 paf 190: pos_after=self_size;
1.60 paf 191: }
192: } else { // empty delim
1.172.2.21.2. (paf 193:): result+=this;
194:): pos_after+=self_size;
1.60 paf 195: }
196: }
197:
1.172.2.14 paf 198: void String::split(ArrayString& result,
1.172.2.21.2. (paf 199:): size_t& pos_after,
1.60 paf 200: const String& delim, Untaint_lang lang,
1.172.2.21.2. (paf 201:): int limit) const {
202:): if(delim) {
1.60 paf 203: int pos_before;
204: // while we have 'delim'...
205: for(; (pos_before=pos(delim, pos_after, lang))>=0 && limit; limit--) {
1.172.2.21.2. (paf 206:): result+=&mid(pos_after, pos_before);
1.60 paf 207: pos_after=pos_before+delim.size();
208: }
209: // last piece
210: if(pos_after<size() && limit) {
1.172.2.21.2. (paf 211:): result+=&mid(pos_after, size());
1.60 paf 212: pos_after=size();
213: }
214: } else { // empty delim
1.172.2.21.2. (paf 215:): result+=this;
216:): pos_after+=size();
1.60 paf 217: }
1.61 paf 218: }
219:
1.172.2.21.2. (paf 220:): static void regex_options(const String& options, int *result, bool& need_pre_post_match){
1.63 paf 221: struct Regex_option {
1.172.2.11 paf 222: const char* keyL;
223: const char* keyU;
1.63 paf 224: int clear, set;
225: int *result;
1.154 paf 226: bool *flag;
1.63 paf 227: } regex_option[]={
1.153 paf 228: {"i", "I", 0, PCRE_CASELESS, result}, // a=A
229: {"s", "S", 0, PCRE_DOTALL, result}, // \n\n$ [default]
230: {"x", "U", 0, PCRE_EXTENDED, result}, // whitespace in regex ignored
231: {"m", "M", PCRE_DOTALL, PCRE_MULTILINE, result}, // ^aaa\n$^bbb\n$
232: {"g", "G", 0, true, result+1}, // many rows
1.154 paf 233: {"'", 0, 0, 0, 0, &need_pre_post_match},
234: {0}
1.63 paf 235: };
1.171 paf 236: result[0]=PCRE_EXTRA | PCRE_DOTALL | PCRE_DOLLAR_ENDONLY;
1.63 paf 237: result[1]=0;
238:
239: if(options)
1.153 paf 240: for(Regex_option *o=regex_option; o->keyL; o++)
1.172.2.21.2. (paf 241:): if(options.pos(o->keyL)>=0
242:): || (o->keyU && options.pos(o->keyU)>=0)) {
1.154 paf 243: if(o->flag)
244: *o->flag=true;
245: else { // result
246: *o->result &= ~o->clear;
247: *o->result |= o->set;
248: }
1.63 paf 249: }
250: }
251:
1.172.2.21.2. (paf 252:): Table* String::match(Charset& source_charset,
1.172.2.4 paf 253: const String& regexp,
1.172.2.21.2. (paf 254:): const String& options,
1.172.2.4 paf 255: Row_action row_action, void *info,
1.172.2.20 paf 256: bool& just_matched) const {
1.172.2.21.2. (paf 257:): if(!regexp)
258:): throw Exception(0,
259:): 0,
1.73 paf 260: "regexp is empty");
1.154 paf 261:
1.172.2.21.2. (paf 262:): const char* pattern=regexp.cstr();
1.172.2.11 paf 263: const char* errptr;
1.62 paf 264: int erroffset;
1.172.2.21.2. (paf 265:): bool need_pre_post_match=false;
1.154 paf 266: int option_bits[2]; regex_options(options, option_bits, need_pre_post_match);
1.172.2.20 paf 267: bool global=option_bits[1]!=0;
1.172.2.21.2. (paf 268:): pcre *code=pcre_compile(pattern, option_bits[0],
1.62 paf 269: &errptr, &erroffset,
1.172.2.1 paf 270: source_charset.pcre_tables);
1.62 paf 271:
1.67 paf 272: if(!code)
1.172.2.21.2. (paf 273:): throw Exception(0,
274:): ®exp.mid(erroffset, regexp.size()),
1.74 paf 275: "regular expression syntax error - %s", errptr);
1.62 paf 276:
1.172.2.20 paf 277: int subpatterns=pcre_info(code, 0, 0);
278: if(subpatterns<0) {
1.100 parser 279: pcre_free(code);
1.149 paf 280: throw Exception(0,
1.172.2.21.2. (paf 281:): ®exp,
1.76 paf 282: "pcre_info error (%d)",
1.172.2.20 paf 283: subpatterns);
1.63 paf 284: }
285:
1.172.2.21.2. (paf 286:): C subject=cstr();
1.172.2.4 paf 287: const int ovecsize=(1/*match*/+MAX_MATCH_GROUPS)*3;
1.155 paf 288: int ovector[ovecsize];
289:
290: // create table
1.172.2.21.2. (paf 291:): Table* table=new Table(string_match_table_template);
1.63 paf 292:
1.64 paf 293: int exec_option_bits=0;
1.154 paf 294: int prestart=0;
295: int poststart=0;
296: int postfinish=size();
1.63 paf 297: while(true) {
298: int exec_substrings=pcre_exec(code, 0,
1.172.2.21.2. (paf 299:): subject, subject.size, prestart,
1.64 paf 300: exec_option_bits, ovector, ovecsize);
1.63 paf 301:
302: if(exec_substrings==PCRE_ERROR_NOMATCH) {
1.100 parser 303: pcre_free(code);
1.172.2.21.2. (paf 304:): row_action(table, 0/*last time, no raw*/, 0, 0, poststart, postfinish, info);
1.172.2.20 paf 305: if(global || subpatterns)
306: return table; // global or with subpatterns=true+result
307: else {
1.172.2.21.2. (paf 308:): just_matched=false; return 0; // not global=no result
1.172.2.20 paf 309: }
1.63 paf 310: }
311:
312: if(exec_substrings<0) {
1.100 parser 313: pcre_free(code);
1.172.2.21.2. (paf 314:): throw Exception(0,
315:): ®exp,
1.76 paf 316: "regular expression execute error (%d)",
1.63 paf 317: exec_substrings);
318: }
319:
1.154 paf 320: int prefinish=ovector[0];
321: poststart=ovector[1];
1.172.2.21.2. (paf 322:): ArrayString* row=new ArrayString;
1.172.2.4 paf 323: if(need_pre_post_match) {
1.172.2.21.2. (paf 324:): *row+=&mid(0, prefinish); // .prematch column value
325:): *row+=&mid(prefinish, poststart); // .match
326:): *row+=&mid(poststart, postfinish); // .postmatch
1.172.2.4 paf 327: } else {
1.172.2.21.2. (paf 328:): *row+=0; // .prematch column value
329:): *row+=0; // .match
330:): *row+=0; // .postmatch
1.172.2.4 paf 331: }
1.63 paf 332:
333: for(int i=1; i<exec_substrings; i++) {
1.69 paf 334: // -1:-1 case handled peacefully by mid() itself
1.172.2.21.2. (paf 335:): *row+=&mid(ovector[i*2+0], ovector[i*2+1]); // .i column value
1.63 paf 336: }
337:
1.172.2.20 paf 338: row_action(table, row, prestart, prefinish, poststart, postfinish, info);
1.63 paf 339:
1.172.2.20 paf 340: if(!global || prestart==poststart) { // not global | going to hang
1.100 parser 341: pcre_free(code);
1.172.2.21.2. (paf 342:): row_action(table, 0/*last time, no row*/, 0, 0, poststart, postfinish, info);
1.172.2.20 paf 343: return table;
1.63 paf 344: }
1.154 paf 345: prestart=poststart;
1.63 paf 346:
347: /*
348: if(option_bits[0] & PCRE_MULTILINE)
1.64 paf 349: exec_option_bits|=PCRE_NOTBOL; // start of subject+startoffset not BOL
1.63 paf 350: */
351: }
1.82 parser 352: }
353:
1.172.2.21.2. (paf 354:): String& String::change_case(Charset& source_charset, Change_case_kind kind) {
355:): String& result=*new String();
1.172.2.4 paf 356:
1.172.2.1 paf 357: const unsigned char *tables=source_charset.pcre_tables;
1.82 parser 358:
359: const unsigned char *a;
360: const unsigned char *b;
361: switch(kind) {
362: case CC_UPPER:
363: a=tables+lcc_offset;
364: b=tables+fcc_offset;
365: break;
366: case CC_LOWER:
367: a=tables+lcc_offset;
368: b=0;
369: break;
370: default:
1.172.2.21.2. (paf 371:): throw Exception(0,
372:): this,
1.82 parser 373: "unknown change case kind #%d",
374: static_cast<int>(kind)); // never
375: a=b=0; // calm, compiler
376: break; // never
377: }
378:
1.172.2.21.2. (paf 379:): C new_cstr=cstr();
380:): const char *end=new_cstr+new_cstr.size;
381:): char *dest=new_cstr;
382:): for(const char* current=new_cstr; current<end; current++) {
383:): unsigned char c=a[(unsigned char)*current];
384:): if(b)
385:): c=b[c];
1.82 parser 386:
1.172.2.21.2. (paf 387:): *dest++=(char)c;
388:): }
389:): result.body=new_cstr;
390:): result.fragments.append(fragments, 0, fragments.count());
1.89 parser 391:
1.101 parser 392: return result;
393: }
394:
1.172.2.21.2. (paf 395:): const String& String::replace(const Dictionary& dict) const {
396:): String& result=*new String();
397:): C old_cstr=cstr();
398:): const char* current=old_cstr;
399:): size_t old_pos=0;
400:):
401:): char *new_cstr=new(PointerFreeGC) char[(size_t)ceil(old_cstr.size*dict.max_ratio())];
402:): char *dest=new_cstr;
403:): size_t remaining_size=old_cstr.size;
404:): do {
405:): if(Table::element_type row=dict.first_that_starts(current, remaining_size)) {
406:): { // prematch
407:): size_t now_pos=current-old_cstr;
408:): if(now_pos!=old_pos) {
409:): result.fragments.append(fragments, old_pos, now_pos);
410:): old_pos=now_pos;
411:): }
1.101 parser 412: }
413:
1.172.2.21.2. (paf 414:): const String* a=row->get(0); size_t a_size=a->size();
415:): // skip 'a' in 'current', in fragment lang index && reduce work size
416:): current+=a_size; old_pos+=a_size; remaining_size-=a_size;
417:):
418:): if(row->count()>1) { // are there any b?
419:): const String* b=row->get(1); size_t b_size=b->size();
420:): if(b_size) {
421:): // write 'b' to 'dest' && skip 'b' in 'dest'
422:): b->store_to(dest, String::UL_AS_IS); dest+=b_size;
1.170 paf 423:
1.172.2.21.2. (paf 424:): // append match fragments
425:): result.fragments.append(b->fragments, 0, b->fragments.count());
426:): }
427:): }
428:): } else {
429:): // write a char to b && reduce work size
430:): *dest++=*current++; remaining_size--;
431:): }
432:): } while(remaining_size);
1.156 paf 433:
1.172.2.21.2. (paf 434:): { // postmatch
435:): size_t now_pos=current-old_cstr;
436:): if(now_pos!=old_pos) // have something at end?
437:): result.fragments.append(fragments, old_pos, now_pos-old_pos);
438:): }
1.156 paf 439:
1.172.2.21.2. (paf 440:): result.body=new_cstr;
1.89 parser 441: return result;
442: }
443:
1.172.2.21.2. (paf 444:): double String::as_double() const {
1.89 parser 445: double result;
1.172.2.4 paf 446: char buf[MAX_STRING];
447: if(size()>MAX_STRING-1)
448: throw Exception("number.format",
1.172.2.21.2. (paf 449:): this,
1.172.2.4 paf 450: "invalid number too long a string (%u>%u)", size(), MAX_STRING-1);
1.172.2.5 paf 451: char *eol=store_to(buf, String::UL_AS_IS); *eol=0;
1.172.2.11 paf 452: const char* cstr=buf;
1.172.2.4 paf 453:
1.161 paf 454: while(*cstr && isspace(*cstr))
455: cstr++;
456: if(!*cstr)
1.162 paf 457: return 0;
1.161 paf 458:
1.102 parser 459: char *error_pos;
1.89 parser 460: // 0xABC
1.99 parser 461: if(cstr[0]=='0')
462: if(cstr[1]=='x' || cstr[1]=='X')
463: result=(double)(unsigned long)strtol(cstr, &error_pos, 0);
464: else
1.102 parser 465: result=(double)strtod(cstr+1/*skip leading 0*/, &error_pos);
1.89 parser 466: else
1.99 parser 467: result=(double)strtod(cstr, &error_pos);
1.89 parser 468:
1.159 paf 469: while(char c=*error_pos++)
470: if(!isspace(c))
471: throw Exception("number.format",
1.172.2.21.2. (paf 472:): this,
1.159 paf 473: "invalid number (double)");
1.89 parser 474:
475: return result;
476: }
1.172.2.21.2. (paf 477:): int String::as_int() const {
1.89 parser 478: int result;
1.172.2.4 paf 479: char buf[MAX_STRING];
480: if(size()>MAX_STRING-1)
481: throw Exception("number.format",
1.172.2.21.2. (paf 482:): this,
1.172.2.4 paf 483: "invalid number too long a string (%u>%u)", size(), MAX_STRING-1);
1.172.2.5 paf 484: char *eol=store_to(buf, String::UL_AS_IS); *eol=0;
1.172.2.11 paf 485: const char* cstr=buf;
1.172.2.4 paf 486:
1.161 paf 487: while(*cstr && isspace(*cstr))
488: cstr++;
489: if(!*cstr)
1.162 paf 490: return 0;
1.161 paf 491:
1.102 parser 492: char *error_pos;
1.89 parser 493: // 0xABC
1.99 parser 494: if(cstr[0]=='0')
495: if(cstr[1]=='x' || cstr[1]=='X')
496: result=(int)(unsigned long)strtol(cstr, &error_pos, 0);
497: else
1.102 parser 498: result=(int)strtol(cstr+1/*skip leading 0*/, &error_pos, 0);
1.89 parser 499: else
500: result=(int)strtol(cstr, &error_pos, 0);
501:
1.159 paf 502: while(char c=*error_pos++)
503: if(!isspace(c))
504: throw Exception("number.format",
1.172.2.21.2. (paf 505:): this,
1.159 paf 506: "invalid number (int)");
1.82 parser 507:
508: return result;
1.61 paf 509: }
1.113 parser 510:
1.172.2.4 paf 511: inline void uint2uchars(uint word, uchar *bytes) {
512: bytes[0]=word&0xFF;
513: bytes[1]=(word>>8)&0xFF;
514: bytes[2]=(word>>16)&0xFF;
515: bytes[3]=(word>>24)&0xFF;
516: }
517: inline uint uchars2uint(uchar *bytes) {
518: return bytes[3]<<24
519: | bytes[2]<<16
520: | bytes[1]<<8
521: | bytes[0];
522: }
523:
/**
	CORD_iter5 batch callback: copies the 0-terminated chunk 's' to the write
	cursor that 'client_data' points to (a char*) and advances the cursor past it.
	Always returns 0.
*/
static int CORD_batched_iter_fn_append(const char* s, void* client_data) {
	char** cursor=static_cast<char**>(client_data);

	const size_t chunk_size=strlen(s);
	memcpy(*cursor, s, chunk_size);
	*cursor+=chunk_size;
	return 0;
}
531:): String::C String::serialize(size_t prolog_size) const {
532:): size_t buf_size=
1.113 parser 533: prolog_size
1.172.2.21.2. (paf 534:): +fragments.count()*(sizeof(Untaint_lang)+sizeof(size_t))
1.113 parser 535: +size();
1.172.2.21.2. (paf 536:): C result(new(PointerFreeGC) char[buf_size], buf_size);
537:):
538:): // 1: prolog
539:): char *cur=result.str+prolog_size;
540:):
541:):
542:): // 2: fragments.count
543:): size_t fragments_count=fragments.count();
544:): memcpy(cur, &fragments_count, sizeof(fragments_count)); cur+=sizeof(fragments_count);
1.113 parser 545:
1.172.2.21.2. (paf 546:): // 3: lang info
547:): for(Array_iterator<ArrayFragment::element_type> i(fragments); i.has_next(); ) {
548:): const Fragment& fragment=i.next();
1.123 paf 549: // lang
1.172.2.21.2. (paf 550:): memcpy(cur, &fragment.lang, sizeof(fragment.lang)); cur+=sizeof(fragment.lang);
1.123 paf 551: // size
1.172.2.21.2. (paf 552:): memcpy(cur, &fragment.size, sizeof(fragment.size)); cur+=sizeof(fragment.size);
553:): }
554:):
555:): // 4: letters
556:): CORD_iter5(body, 0, 0, CORD_batched_iter_fn_append, &cur);
557:):
558:): return result;
1.113 parser 559: }
1.172.2.11 paf 560: bool String::deserialize(size_t prolog_size, void *buf, size_t buf_size, const char* file) {
1.135 paf 561: if(buf_size<=prolog_size)
1.148 paf 562: return false;
1.113 parser 563: buf_size-=prolog_size;
564:
1.172.2.21.2. (paf 565:): // 1: prolog
566:): const char *cur=(const char *)buf+prolog_size;
1.148 paf 567:
1.172.2.21.2. (paf 568:): // 2: fragments.count
569:): if(buf_size<sizeof(size_t)) // fragments.count don't fit?
570:): return false;
571:): size_t fragments_count=*reinterpret_cast<const size_t*>(cur); cur+=sizeof(size_t);
572:): buf_size-=sizeof(size_t);
1.128 paf 573:
1.172.2.21.2. (paf 574:): // 3: lang info
575:): size_t total_size=0;
576:): for(size_t f=0; f<fragments_count; f++) {
577:): size_t piece_size=sizeof(Untaint_lang)+sizeof(size_t);
578:): if(buf_size<piece_size) // lang+size
1.148 paf 579: return false;
580:
1.172.2.21.2. (paf 581:): Untaint_lang lang=*reinterpret_cast<const Untaint_lang *>(cur); cur+=sizeof(Untaint_lang);
582:): size_t fragment_size=*reinterpret_cast<const size_t*>(cur); cur+=sizeof(size_t);
583:): fragments+=Fragment(lang, fragment_size);
584:): total_size+=fragment_size;
1.113 parser 585:
586: buf_size-=piece_size;
587: }
1.172.2.21.2. (paf 588:):
589:): // 4: letters
590:): if(buf_size!=total_size)
591:): return false;
592:):
593:): body=CORD_cat_char_star(CORD_EMPTY, cur, buf_size);
594:):
1.148 paf 595: return true;
1.113 parser 596: }
E-mail: