Annotation of parser3/src/main/pa_common.C, revision 1.87
1.15 paf 1: /** @file
1.16 paf 2: Parser: common functions.
3:
1.8 paf 4: Copyright(c) 2001 ArtLebedev Group(http://www.artlebedev.com)
1.85 paf 5: Author: Alexander Petrosyan <paf@design.ru>(http://paf.design.ru)
1.16 paf 6:
1.87 ! paf 7: $Id: pa_common.C,v 1.86 2001/11/09 11:06:57 paf Exp $
1.1 paf 8: */
9:
10: #include "pa_common.h"
1.2 paf 11: #include "pa_types.h"
1.4 paf 12: #include "pa_exception.h"
1.14 paf 13: #include "pa_pool.h"
14: #include "pa_globals.h"
15: #include "pa_value.h"
16: #include "pa_hash.h"
17: #include "pa_string.h"
1.1 paf 18:
1.82 paf 19: #ifndef _O_TEXT
20: # define _O_TEXT 0
21: #endif
22: #ifndef _O_BINARY
23: # define _O_BINARY 0
1.47 paf 24: #endif
1.80 paf 25: #ifndef O_TRUNC
26: # define O_TRUNC 0
27: #endif
28:
1.22 paf 29: #if _MSC_VER
1.1 paf 30:
31: int __vsnprintf(char *b, size_t s, const char *f, va_list l) {
32: int r=_vsnprintf(b, --s, f, l);
33: b[s]=0;
34: return r;
35: }
36: int __snprintf(char *b, size_t s, const char *f, ...) {
37: va_list l;
38: va_start(l, f);
39: int r=__vsnprintf(b, s, f, l);
40: va_end(l);
41: return r;
42: }
43:
44: #endif
1.2 paf 45:
/// Bounded strchr: looks for @a c among the first @a size bytes of @a buf.
/// @return pointer to the first match, 0 when there is none
static char *strnchr(char *buf, size_t size, char c) {
	char * const end=buf+size;
	for(char *p=buf; p!=end; p++)
		if(*p==c)
			return p;

	return 0;
}

/// Normalizes line breaks in place:
///   DOS       \r\n -> \n
///   Macintosh \r   -> \n
/// @param buf  buffer holding @a size bytes; it need not be zero-terminated
/// @param size in: byte count in @a buf; out: byte count after the conversion
///             (shrinks by one for every \r\n pair)
/// Bytes of @a buf beyond the new @a size are left unspecified; the caller
/// places a terminator itself when it needs one.
void fix_line_breaks(char *buf, size_t& size) {
	const char * const eob=buf+size;
	char *dest=buf; // where the next converted byte goes
	char *bol=buf; // start of the not yet processed piece

	while(char *eol=strnchr(bol, eob-bol, '\r')) {
		const size_t len=eol-bol;
		// source and destination overlap as soon as one \r\n was collapsed,
		// so memmove is required here [memcpy on overlapping ranges is undefined]
		if(dest!=bol)
			memmove(dest, bol, len);
		dest+=len;
		*dest++='\n';

		if(eol+1<eob && eol[1]=='\n') { // \r,\n = DOS
			bol=eol+2;
			size--;
		} else // \r,not \n = Macintosh
			bol=eol+1;
	}

	// last piece without \r [only the bytes up to eob, no terminator is copied]
	if(dest!=bol)
		memmove(dest, bol, eob-bol);
}
1.18 paf 79:
1.28 paf 80: char *file_read_text(Pool& pool, const String& file_spec, bool fail_on_read_problem) {
1.72 parser 81: void *result; size_t size;
82: return file_read(pool, file_spec, result, size, true, fail_on_read_problem)?(char *)result:0;
1.34 paf 83: }
84: bool file_read(Pool& pool, const String& file_spec,
1.87 ! paf 85: void*& data, size_t& data_size, bool as_text,
1.44 paf 86: bool fail_on_read_problem,
87: size_t offset, size_t limit) {
1.64 parser 88: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.62 parser 89: //printf("file_read(%s)\n", fname);
1.33 paf 90: int f;
1.2 paf 91: struct stat finfo;
1.33 paf 92:
93: // first open, next stat:
1.45 paf 94: // directory update of NTFS hard links performed on open.
1.33 paf 95: // ex:
96: // a.html:^test[] and b.html hardlink to a.html
97: // user inserts ! before ^test in a.html
98: // directory entry of b.html in NTFS not updated at once,
1.35 paf 99: // they delay update till open, so we would receive "!^test[" string
100: // if would do stat, next open.
1.34 paf 101: if(
1.72 parser 102: (f=open(fname, O_RDONLY|(as_text?_O_BINARY/*_O_TEXT*/:_O_BINARY)))>=0 &&
1.34 paf 103: stat(fname, &finfo)==0) {
1.2 paf 104: /*if(exclusive)
105: flock(f, LOCK_EX);*/
1.44 paf 106: size_t max_size=limit?min(offset+limit, finfo.st_size)-offset:finfo.st_size;
1.87 ! paf 107: int read_size;
1.47 paf 108: if(!max_size) { // eof
1.83 paf 109: if(as_text) {
110: data=pool.malloc(1);
111: *(char*)data=0;
112: } else
113: data=0;
1.47 paf 114: read_size=0;
1.59 parser 115: } else {
1.78 paf 116: data=pool.malloc(max_size+(as_text?1:0), 3);
1.59 parser 117: if(offset)
118: lseek(f, offset, SEEK_SET);
119: read_size=read(f, data, max_size);
1.47 paf 120: }
1.2 paf 121: /*if(exclusive)
122: flock(f, LOCK_UN);*/
123: close(f);
1.59 parser 124: if(!max_size) // eof
125: return true;
1.32 paf 126:
1.87 ! paf 127: if(read_size<0 || read_size>max_size)
1.73 parser 128: throw Exception(0, 0,
1.33 paf 129: &file_spec,
1.44 paf 130: "read failed: actually read %d bytes count not in [0..%lu] valid range",
131: read_size, (unsigned long)max_size); //never
1.87 ! paf 132:
! 133: data_size=read_size;
! 134: if(as_text) {
! 135: fix_line_breaks((char *)data, data_size);
! 136: // note: after fixing
! 137: ((char*&)data)[data_size]=0;
! 138: }
1.72 parser 139: return true;
1.2 paf 140: }
1.4 paf 141: if(fail_on_read_problem)
1.73 parser 142: throw Exception(0, 0,
1.33 paf 143: &file_spec,
1.54 parser 144: "read failed: %s (%d), actual filename '%s'",
145: strerror(errno), errno, fname);
1.34 paf 146: return false;
1.8 paf 147: }
148:
1.63 parser 149: static void create_dir_for_file(const String& file_spec) {
150: size_t pos_after=1;
151: int pos_before;
152: while((pos_before=file_spec.pos("/", 1, pos_after))>=0) {
1.64 parser 153: mkdir(file_spec.mid(0, pos_before).cstr(String::UL_FILE_SPEC), 0775);
1.63 parser 154: pos_after=pos_before+1;
155: }
156: }
157:
1.18 paf 158: void file_write(Pool& pool,
1.28 paf 159: const String& file_spec,
1.34 paf 160: const void *data, size_t size,
1.80 paf 161: bool as_text,
162: bool do_append/*,
1.20 paf 163: bool exclusive*/) {
1.64 parser 164: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.28 paf 165: int f;
1.80 paf 166: if(access(fname, W_OK)!=0) // no
1.63 parser 167: create_dir_for_file(file_spec);
1.50 paf 168:
1.80 paf 169: if((f=open(fname,
170: O_CREAT|O_RDWR
171: |(as_text?_O_TEXT:_O_BINARY)
172: |(do_append?O_APPEND:O_TRUNC), 0666))>=0) {
173: /*if(exclusive)
174: flock(f, LOCK_EX);*/
175:
176: if(size) write(f, data, size);
177: #if O_TRUNC==0
178: ftruncate(f, size);
1.18 paf 179: #endif
1.80 paf 180: /*if(exclusive)
181: flock(f, LOCK_UN);*/
182: close(f);
183: } else
184: throw Exception(0, 0,
185: &file_spec,
186: "write failed: %s (%d), actual filename '%s'",
187: strerror(errno), errno, fname);
1.30 paf 188: }
189:
1.63 parser 190: // throws nothing! [this is required in file_move & file_delete]
1.50 paf 191: static void rmdir(const String& file_spec, size_t pos_after) {
192: int pos_before;
193: if((pos_before=file_spec.pos("/", 1, pos_after))>=0)
194: rmdir(file_spec, pos_before+1);
195:
1.64 parser 196: rmdir(file_spec.mid(0, pos_after-1/* / */).cstr(String::UL_FILE_SPEC));
1.50 paf 197: }
1.30 paf 198: void file_delete(Pool& pool, const String& file_spec) {
1.64 parser 199: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.54 parser 200: if(unlink(fname)!=0)
1.73 parser 201: throw Exception(0, 0,
1.33 paf 202: &file_spec,
1.54 parser 203: "unlink failed: %s (%d), actual filename '%s'",
204: strerror(errno), errno, fname);
1.50 paf 205:
206: rmdir(file_spec, 1);
1.60 parser 207: }
208: void file_move(Pool& pool, const String& old_spec, const String& new_spec) {
1.64 parser 209: const char *old_spec_cstr=old_spec.cstr(String::UL_FILE_SPEC);
210: const char *new_spec_cstr=new_spec.cstr(String::UL_FILE_SPEC);
1.63 parser 211:
212: create_dir_for_file(new_spec);
213:
1.60 parser 214: if(rename(old_spec_cstr, new_spec_cstr)!=0)
1.73 parser 215: throw Exception(0, 0,
1.60 parser 216: &old_spec,
217: "rename failed: %s (%d), actual filename '%s' to '%s'",
218: strerror(errno), errno, old_spec_cstr, new_spec_cstr);
1.63 parser 219:
220: rmdir(old_spec, 1);
1.31 paf 221: }
222:
1.51 paf 223:
224: static bool entry_readable(const String& file_spec, bool need_dir) {
1.64 parser 225: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.51 paf 226: struct stat finfo;
227: if(access(fname, R_OK)==0 && stat(fname, &finfo)==0) {
1.73 parser 228: bool is_dir=finfo.st_mode&S_IFDIR != 0;
1.51 paf 229: return is_dir==need_dir;
230: }
231: return false;
232: }
1.31 paf 233: bool file_readable(const String& file_spec) {
1.51 paf 234: return entry_readable(file_spec, false);
235: }
236: bool dir_readable(const String& file_spec) {
237: return entry_readable(file_spec, true);
1.65 parser 238: }
239: String *file_readable(const String& path, const String& name) {
240: String *result=new(path.pool()) String(path);
241: *result << "/";
242: *result << name;
243: return file_readable(*result)?result:0;
1.43 paf 244: }
245: bool file_executable(const String& file_spec) {
1.64 parser 246: return access(file_spec.cstr(String::UL_FILE_SPEC), X_OK)==0;
1.44 paf 247: }
248:
1.64 parser 249: bool file_stat(const String& file_spec,
1.58 parser 250: size_t& rsize,
251: time_t& ratime,
252: time_t& rmtime,
1.64 parser 253: time_t& rctime,
254: bool fail_on_read_problem) {
1.44 paf 255: Pool& pool=file_spec.pool();
1.64 parser 256: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.44 paf 257: struct stat finfo;
258: if(stat(fname, &finfo)!=0)
1.64 parser 259: if(fail_on_read_problem)
1.73 parser 260: throw Exception(0, 0,
1.67 parser 261: &file_spec,
262: "getting file size failed: %s (%d), real filename '%s'",
263: strerror(errno), errno, fname);
1.64 parser 264: else
265: return false;
1.58 parser 266: rsize=finfo.st_size;
267: ratime=finfo.st_atime;
268: rmtime=finfo.st_mtime;
269: rctime=finfo.st_ctime;
1.64 parser 270: return true;
1.18 paf 271: }
272:
/// Cuts the next row off a delimited text, modifying the text in place.
/// @param row_ref in: start of the not yet consumed text [may point to 0];
///                out: start of the text after the delimiter, 0 when no delimiter was found
/// @param delim   row delimiter, it gets replaced with a terminating zero
/// @return the row; 0 when *row_ref was 0, or when the text left is empty
char *getrow(char **row_ref, char delim) {
	char * const row=*row_ref;
	if(!row)
		return 0;

	char * const cut=strchr(row, delim);
	if(cut) {
		*cut=0;
		*row_ref=cut+1;
		return row;
	}

	// the last piece: nothing follows it
	*row_ref=0;
	return *row?row:0;
}
284:
/// Splits @a string in place at the first @a delim.
/// @return the part after the delimiter [the delimiter itself is replaced with zero];
///         0 when @a string is 0 or has no delimiter
char *lsplit(char *string, char delim) {
	if(!string)
		return 0;

	char * const found=strchr(string, delim);
	if(!found)
		return 0;

	*found=0;
	return found+1;
}

/// Splits *string_ref in place at the first @a delim and advances it.
/// @param string_ref in: text to split; out: the part after the delimiter,
///                   0 when there was none
/// @return the original *string_ref, now ending where the delimiter was
char *lsplit(char **string_ref, char delim) {
	char * const head=*string_ref;
	*string_ref=lsplit(head, delim);
	return head;
}
302:
/// Splits @a string in place at the last @a delim.
/// @return the part after the delimiter [the delimiter itself is replaced with zero];
///         NULL when @a string is NULL or has no delimiter
char *rsplit(char *string, char delim) {
	char *found=string?strrchr(string, delim):NULL;
	if(!found)
		return NULL;

	*found=0;
	return found+1;
}
313:
1.37 paf 314: /// @todo less stupid type detection
1.10 paf 315: char *format(Pool& pool, double value, char *fmt) {
1.78 paf 316: char *result=(char *)pool.malloc(MAX_NUMBER, 4);
1.10 paf 317: if(fmt)
318: if(strpbrk(fmt, "diouxX"))
319: if(strpbrk(fmt, "ouxX"))
1.33 paf 320: snprintf(result, MAX_NUMBER, fmt, (uint)value );
1.10 paf 321: else
1.33 paf 322: snprintf(result, MAX_NUMBER, fmt, (int)value );
1.10 paf 323: else
324: snprintf(result, MAX_NUMBER, fmt, value);
325: else
1.33 paf 326: snprintf(result, MAX_NUMBER, "%d", (int)value);
1.10 paf 327:
328: return result;
1.12 paf 329: }
330:
/// Writes @a size bytes of @a buf to stdout.
/// On WIN32 the data is written in chunks of at most 8K.
/// @return number of bytes actually written, on all platforms
///         [the WIN32 branch used to return the number of bytes NOT written]
size_t stdout_write(const void *buf, size_t size) {
#ifdef WIN32
	const size_t chunk_max=8*0x400;
	const size_t to_write=size;

	while(size>0) {
		const size_t chunk_written=fwrite(buf, 1, size<chunk_max?size:chunk_max, stdout);
		if(chunk_written==0) // error, give up
			break;
		size-=chunk_written;
		buf=((const char*)buf)+chunk_written;
	}

	return to_write-size;
#else
	return fwrite(buf, 1, size, stdout);
#endif
}
1.14 paf 346:
1.77 parser 347: char *unescape_chars(Pool& pool, const char *cp, int len) {
1.78 paf 348: char *s=(char *)pool.malloc(len + 1, 5);
1.14 paf 349: enum EscapeState {
1.33 paf 350: EscapeRest,
351: EscapeFirst,
1.14 paf 352: EscapeSecond
353: } escapeState=EscapeRest;
354: int escapedValue=0;
355: int srcPos=0;
356: int dstPos=0;
357: while(srcPos < len) {
358: int ch=cp[srcPos];
359: switch(escapeState) {
360: case EscapeRest:
361: if(ch=='%') {
362: escapeState=EscapeFirst;
363: } else if(ch=='+') {
364: s[dstPos++]=' ';
365: } else {
366: s[dstPos++]=ch;
367: }
368: break;
369: case EscapeFirst:
370: escapedValue=hex_value[ch] << 4;
371: escapeState=EscapeSecond;
372: break;
373: case EscapeSecond:
374: escapedValue +=hex_value[ch];
375: s[dstPos++]=escapedValue;
376: escapeState=EscapeRest;
377: break;
378: }
379: srcPos++;
380: }
381: s[dstPos]=0;
382: return s;
383: }
384:
1.52 paf 385: /// used by attributed_meaning_to_string / append_attribute_subattribute
1.40 paf 386: struct Attributed_meaning_info {
1.52 paf 387: String *header; // header line being constructed
388: String::Untaint_lang lang; // language in which to append to that line
1.40 paf 389: };
1.17 paf 390: static void append_attribute_subattribute(const Hash::Key& akey, Hash::Val *avalue,
1.14 paf 391: void *info) {
392: if(akey==VALUE_NAME)
393: return;
394:
1.40 paf 395: Attributed_meaning_info& ami=*static_cast<Attributed_meaning_info *>(info);
396:
1.14 paf 397: // ...; charset=windows1251
1.48 paf 398: *ami.header << "; ";
1.70 parser 399: ami.header->append(akey, ami.lang);
1.48 paf 400: *ami.header << "=";
1.70 parser 401: ami.header->append(static_cast<Value *>(avalue)->as_string(), ami.lang);
1.14 paf 402: }
1.49 paf 403: const String& attributed_meaning_to_string(Value& meaning,
404: String::Untaint_lang lang) {
1.20 paf 405: String &result=*new(meaning.pool()) String(meaning.pool());
1.75 parser 406: if(Hash *hash=meaning.get_hash(0)) {
1.14 paf 407: // $value(value) $subattribute(subattribute value)
408: if(Value *value=static_cast<Value *>(hash->get(*value_name)))
1.40 paf 409: result.append(value->as_string(), lang, true);
1.14 paf 410:
1.40 paf 411: Attributed_meaning_info attributed_meaning_info={
1.52 paf 412: &result,
413: lang
1.40 paf 414: };
415: hash->for_each(append_attribute_subattribute, &attributed_meaning_info);
1.14 paf 416: } else // result value
1.40 paf 417: result.append(meaning.as_string(), lang, true);
1.14 paf 418:
419: return result;
1.24 paf 420: }
421:
422: #ifdef WIN32
/// Replaces every '\\' with '/' in a zero-terminated string, in place.
/// A 0 pointer is accepted and ignored.
void back_slashes_to_slashes(char *s) {
	if(!s)
		return;

	while(*s) {
		if(*s=='\\')
			*s='/';
		++s;
	}
}
1.42 paf 429: /*
430: void slashes_to_back_slashes(char *s) {
431: if(s)
432: for(; *s; s++)
433: if(*s=='/')
434: *s='\\';
435: }
436: */
1.24 paf 437: #endif
1.41 paf 438:
/// Compares two zero-terminated strings ignoring the case of letters.
/// @param s1     first string; where it has a letter, the comparison is caseless
/// @param s2     second string
/// @param strict true = the strings must have equal length;
///               false = it is enough for one string to be a prefix of the other
/// @return true when the strings are considered equal
bool StrEqNc(const char *s1, const char *s2, bool strict) {
	for(; ; s1++, s2++) {
		// isalpha/tolower are undefined for negative arguments,
		// so bytes >=0x80 must get there as unsigned char values
		const unsigned char c1=(unsigned char)*s1;
		const unsigned char c2=(unsigned char)*s2;

		if(!c1 || !c2) // at least one of the strings has ended
			return (!c1 && !c2) || !strict;

		if(isalpha(c1)) {
			if(tolower(c1)!=tolower(c2))
				return false;
		} else if(c1!=c2)
			return false;
	}
}
457:
/// @return true when @a year has 29 days in February:
///         it is divisible by 4, and is either not divisible by 100 or divisible by 400
static bool isLeap(int year) {
	if(year % 4)
		return false;
	if(year % 100)
		return true;
	return (year % 400)==0;
}

/// Number of days in a month.
/// @param year  the year, matters for February only
/// @param month zero-based month number: 0=January .. 11=December
/// @return number of days; 0 when @a month is not in 0..11
///         [used to read outside of the table then]
int getMonthDays(int year, int month) {
	static const int monthDays[]={
		31, 28, 31, 30, 31, 30,
		31, 31, 30, 31, 30, 31
	};
	const int monthCount=sizeof(monthDays)/sizeof(monthDays[0]);

	if(month<0 || month>=monthCount)
		return 0;

	if(month==1/*February*/ && isLeap(year))
		return 29;
	return monthDays[month];
}
1.69 parser 481:
/// Makes the text in [start, end) single-line, in place:
/// every '\n' becomes '|', every '\r' becomes ' '.
void remove_crlf(char *start, char *end) {
	for(char *cur=start; cur<end; ++cur) {
		if(*cur=='\n')
			*cur='|';
		else if(*cur=='\r')
			*cur=' ';
	}
}
E-mail: