Annotation of parser3/src/main/pa_common.C, revision 1.96
1.15 paf 1: /** @file
1.16 paf 2: Parser: common functions.
3:
1.8 paf 4: Copyright(c) 2001 ArtLebedev Group(http://www.artlebedev.com)
1.85 paf 5: Author: Alexander Petrosyan <paf@design.ru>(http://paf.design.ru)
1.16 paf 6:
1.96 ! paf 7: $Id: pa_common.C,v 1.95 2002/01/25 11:33:46 paf Exp $
1.1 paf 8: */
9:
10: #include "pa_common.h"
1.2 paf 11: #include "pa_types.h"
1.4 paf 12: #include "pa_exception.h"
1.14 paf 13: #include "pa_pool.h"
14: #include "pa_globals.h"
15: #include "pa_value.h"
16: #include "pa_hash.h"
17: #include "pa_string.h"
1.1 paf 18:
1.93 paf 19: // some maybe-undefined constants
20:
// Fallbacks for open() flags that a platform may not provide:
// a missing flag is defined as 0, so OR-ing it into a mode changes nothing.
#if !defined(_O_TEXT)
#	define _O_TEXT 0
#endif
#if !defined(_O_BINARY)
#	define _O_BINARY 0
#endif
#if !defined(O_TRUNC)
#	define O_TRUNC 0
#endif
30:
1.93 paf 31: // locking constants
32:
// LOCK_EX: exclusive lock operation code.
// When the platform does not define it, map it to the _locking() constant
// (win32) or to the lockf() constant (sun).
#if !defined(LOCK_EX)
#	if defined(_LK_LOCK)
		// win32
#		define LOCK_EX _LK_LOCK
#	elif defined(F_LOCK)
		// sun
#		define LOCK_EX F_LOCK
#	else
#		error unable to define LOCK_EX
#	endif
#endif
46:
// LOCK_SH: shared lock operation code.
// When the platform does not define it, map it to the _locking() constant
// (win32) or to the lockf() constant (sun).
#if !defined(LOCK_SH)
#	if defined(_LK_RLCK)
		// win32
#		define LOCK_SH _LK_RLCK
#	elif defined(F_LOCK)
		// sun
		/// @todo shared lock bit: F_LOCK is the same constant LOCK_EX falls back to,
		/// the proper shared-lock constant of that group still has to be found
#		define LOCK_SH F_LOCK
#	else
#		error unable to define LOCK_SH
#	endif
#endif
61:
// LOCK_UN: unlock operation code.
// When the platform does not define it, map it to the _locking() constant
// (win32) or to the lockf() constant (sun).
#if !defined(LOCK_UN)
#	if defined(_LK_UNLCK)
		// win32
#		define LOCK_UN _LK_UNLCK
#	elif defined(F_ULOCK)
		// sun
#		define LOCK_UN F_ULOCK
#	else
#		error unable to define LOCK_UN
#	endif
#endif
75:
76: #ifndef HAVE_FLOCK
77: // win32
78: #ifdef HAVE__LOCKING
79: static void flock(int fd, int operation) {
80: lseek(fd, 0, SEEK_SET);
81: while(_locking(fd, operation, 1)!=0);
82: lseek(fd, 0, SEEK_SET);
83: }
84: #else
85: // sun
86: #ifdef HAVE_LOCKF
87: static void flock(int fd, int operation) {
88: lseek(fd, 0, SEEK_SET);
89: lockf(fd, operation, 1);
90: lseek(fd, 0, SEEK_SET);
91: }
92: #else
93: #error unable to find locking func
94: #endif
95: #endif
96: #endif
97:
/// Finds the first occurrence of @a c in the first @a size bytes of @a buf.
/// Zero bytes do not stop the search.
/// @return pointer to the found byte, or 0 when there is none
static char *strnchr(char *buf, size_t size, char c) {
	char * const end=buf+size;
	for(char *cursor=buf; cursor!=end; ++cursor)
		if(*cursor==c)
			return cursor;

	return 0;
}
106:
/**
	Normalizes line breaks in place.

	DOS "\r\n" pairs and lone Macintosh "\r" both become a single "\n".

	@param buf buffer to fix, processed as @a size raw bytes (zero bytes are ordinary data)
	@param size in: number of bytes in @a buf; out: number of bytes after fixing
		(shrinks by one for every "\r\n" pair)

	No terminating zero is written: a caller that needs one must store it
	at buf[size] after the call.

	The buffer is rewritten in one pass with separate read/write positions.
	The write position never overtakes the read position, so no block copy
	between overlapping parts of the buffer is needed
	[memcpy must not be used on overlapping ranges].
*/
void fix_line_breaks(char *buf, size_t& size) {
	const char * const eob=buf+size;
	char *dest=buf;
	for(const char *src=buf; src<eob; ++src) {
		char c=*src;
		if(c=='\r') {
			// \r,\n = DOS: swallow the \n too
			// \r,not \n = Macintosh: the \r alone is the line break
			if(src+1<eob && src[1]=='\n')
				++src;
			c='\n';
		}
		*dest++=c;
	}
	size=dest-buf;
}
1.18 paf 131:
1.28 paf 132: char *file_read_text(Pool& pool, const String& file_spec, bool fail_on_read_problem) {
1.72 parser 133: void *result; size_t size;
134: return file_read(pool, file_spec, result, size, true, fail_on_read_problem)?(char *)result:0;
1.34 paf 135: }
136: bool file_read(Pool& pool, const String& file_spec,
1.87 paf 137: void*& data, size_t& data_size, bool as_text,
1.44 paf 138: bool fail_on_read_problem,
139: size_t offset, size_t limit) {
1.64 parser 140: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.62 parser 141: //printf("file_read(%s)\n", fname);
1.33 paf 142: int f;
1.2 paf 143: struct stat finfo;
1.33 paf 144:
145: // first open, next stat:
1.45 paf 146: // directory update of NTFS hard links performed on open.
1.33 paf 147: // ex:
148: // a.html:^test[] and b.html hardlink to a.html
149: // user inserts ! before ^test in a.html
150: // directory entry of b.html in NTFS not updated at once,
1.35 paf 151: // they delay update till open, so we would receive "!^test[" string
152: // if would do stat, next open.
1.34 paf 153: if(
1.72 parser 154: (f=open(fname, O_RDONLY|(as_text?_O_BINARY/*_O_TEXT*/:_O_BINARY)))>=0 &&
1.34 paf 155: stat(fname, &finfo)==0) {
1.93 paf 156: flock(f, LOCK_SH);
1.44 paf 157: size_t max_size=limit?min(offset+limit, finfo.st_size)-offset:finfo.st_size;
1.87 paf 158: int read_size;
1.47 paf 159: if(!max_size) { // eof
1.83 paf 160: if(as_text) {
161: data=pool.malloc(1);
162: *(char*)data=0;
163: } else
164: data=0;
1.47 paf 165: read_size=0;
1.59 parser 166: } else {
1.78 paf 167: data=pool.malloc(max_size+(as_text?1:0), 3);
1.59 parser 168: if(offset)
169: lseek(f, offset, SEEK_SET);
170: read_size=read(f, data, max_size);
1.47 paf 171: }
1.93 paf 172: flock(f, LOCK_UN);
1.2 paf 173: close(f);
1.59 parser 174: if(!max_size) // eof
175: return true;
1.32 paf 176:
1.94 paf 177: if(read_size<0 || size_t(read_size)>max_size)
1.73 parser 178: throw Exception(0, 0,
1.33 paf 179: &file_spec,
1.44 paf 180: "read failed: actually read %d bytes count not in [0..%lu] valid range",
181: read_size, (unsigned long)max_size); //never
1.87 paf 182:
183: data_size=read_size;
184: if(as_text) {
185: fix_line_breaks((char *)data, data_size);
186: // note: after fixing
187: ((char*&)data)[data_size]=0;
188: }
1.72 parser 189: return true;
1.2 paf 190: }
1.4 paf 191: if(fail_on_read_problem)
1.73 parser 192: throw Exception(0, 0,
1.33 paf 193: &file_spec,
1.54 parser 194: "read failed: %s (%d), actual filename '%s'",
195: strerror(errno), errno, fname);
1.34 paf 196: return false;
1.8 paf 197: }
198:
1.63 parser 199: static void create_dir_for_file(const String& file_spec) {
200: size_t pos_after=1;
201: int pos_before;
202: while((pos_before=file_spec.pos("/", 1, pos_after))>=0) {
1.64 parser 203: mkdir(file_spec.mid(0, pos_before).cstr(String::UL_FILE_SPEC), 0775);
1.63 parser 204: pos_after=pos_before+1;
205: }
206: }
207:
1.96 ! paf 208: void file_action_under_lock(
1.28 paf 209: const String& file_spec,
1.96 ! paf 210: const char *action_name, void (*action)(int, void *), void *context,
1.80 paf 211: bool as_text,
1.93 paf 212: bool do_append) {
1.64 parser 213: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.28 paf 214: int f;
1.80 paf 215: if(access(fname, W_OK)!=0) // no
1.63 parser 216: create_dir_for_file(file_spec);
1.50 paf 217:
1.80 paf 218: if((f=open(fname,
219: O_CREAT|O_RDWR
220: |(as_text?_O_TEXT:_O_BINARY)
1.92 paf 221: |(do_append?O_APPEND:O_TRUNC), 0664))>=0) {
1.93 paf 222: flock(f, LOCK_EX);
1.96 ! paf 223:
! 224: try {
! 225: action(f, context);
! 226: } catch(...) {
! 227: flock(f, LOCK_UN);
! 228: close(f);
! 229: /*re*/throw;
! 230: }
1.80 paf 231:
1.93 paf 232: flock(f, LOCK_UN);
1.80 paf 233: close(f);
234: } else
235: throw Exception(0, 0,
236: &file_spec,
1.96 ! paf 237: "%s failed: %s (%d), actual filename '%s'",
! 238: action_name, strerror(errno), errno, fname);
! 239: // here should be nothing, see rethrow above
! 240: }
! 241:
#ifndef DOXYGEN
// context handed by file_write to file_write_action
struct File_write_action_info {
	const void *data; // bytes to write
	size_t size; // number of bytes at data
};
#endif
! 247: static void file_write_action(int f, void *context) {
! 248: File_write_action_info& info=*static_cast<File_write_action_info *>(context);
! 249: if(info.size)
! 250: write(f, info.data, info.size);
! 251: #if O_TRUNC==0
! 252: ftruncate(f, info.size);
! 253: #endif
! 254: }
! 255: void file_write(
! 256: const String& file_spec,
! 257: const void *data, size_t size,
! 258: bool as_text,
! 259: bool do_append) {
! 260: File_write_action_info info={data, size};
! 261: file_action_under_lock(
! 262: file_spec,
! 263: "write", file_write_action, &info,
! 264: as_text,
! 265: do_append);
1.30 paf 266: }
267:
1.63 parser 268: // throws nothing! [this is required in file_move & file_delete]
1.50 paf 269: static void rmdir(const String& file_spec, size_t pos_after) {
270: int pos_before;
271: if((pos_before=file_spec.pos("/", 1, pos_after))>=0)
272: rmdir(file_spec, pos_before+1);
273:
1.64 parser 274: rmdir(file_spec.mid(0, pos_after-1/* / */).cstr(String::UL_FILE_SPEC));
1.50 paf 275: }
1.95 paf 276: bool file_delete(const String& file_spec, bool fail_on_read_problem) {
1.64 parser 277: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.54 parser 278: if(unlink(fname)!=0)
1.93 paf 279: if(fail_on_read_problem)
280: throw Exception(0, 0,
281: &file_spec,
282: "unlink failed: %s (%d), actual filename '%s'",
283: strerror(errno), errno, fname);
284: else
285: return false;
1.50 paf 286:
287: rmdir(file_spec, 1);
1.93 paf 288: return true;
1.60 parser 289: }
1.95 paf 290: void file_move(const String& old_spec, const String& new_spec) {
1.64 parser 291: const char *old_spec_cstr=old_spec.cstr(String::UL_FILE_SPEC);
292: const char *new_spec_cstr=new_spec.cstr(String::UL_FILE_SPEC);
1.63 parser 293:
294: create_dir_for_file(new_spec);
295:
1.60 parser 296: if(rename(old_spec_cstr, new_spec_cstr)!=0)
1.73 parser 297: throw Exception(0, 0,
1.60 parser 298: &old_spec,
299: "rename failed: %s (%d), actual filename '%s' to '%s'",
300: strerror(errno), errno, old_spec_cstr, new_spec_cstr);
1.63 parser 301:
302: rmdir(old_spec, 1);
1.31 paf 303: }
304:
1.51 paf 305:
306: static bool entry_readable(const String& file_spec, bool need_dir) {
1.64 parser 307: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.51 paf 308: struct stat finfo;
309: if(access(fname, R_OK)==0 && stat(fname, &finfo)==0) {
1.73 parser 310: bool is_dir=finfo.st_mode&S_IFDIR != 0;
1.51 paf 311: return is_dir==need_dir;
312: }
313: return false;
314: }
1.31 paf 315: bool file_readable(const String& file_spec) {
1.51 paf 316: return entry_readable(file_spec, false);
317: }
318: bool dir_readable(const String& file_spec) {
319: return entry_readable(file_spec, true);
1.65 parser 320: }
321: String *file_readable(const String& path, const String& name) {
322: String *result=new(path.pool()) String(path);
323: *result << "/";
324: *result << name;
325: return file_readable(*result)?result:0;
1.43 paf 326: }
327: bool file_executable(const String& file_spec) {
1.64 parser 328: return access(file_spec.cstr(String::UL_FILE_SPEC), X_OK)==0;
1.44 paf 329: }
330:
1.64 parser 331: bool file_stat(const String& file_spec,
1.58 parser 332: size_t& rsize,
333: time_t& ratime,
334: time_t& rmtime,
1.64 parser 335: time_t& rctime,
336: bool fail_on_read_problem) {
1.44 paf 337: Pool& pool=file_spec.pool();
1.64 parser 338: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.44 paf 339: struct stat finfo;
340: if(stat(fname, &finfo)!=0)
1.64 parser 341: if(fail_on_read_problem)
1.73 parser 342: throw Exception(0, 0,
1.67 parser 343: &file_spec,
344: "getting file size failed: %s (%d), real filename '%s'",
345: strerror(errno), errno, fname);
1.64 parser 346: else
347: return false;
1.58 parser 348: rsize=finfo.st_size;
349: ratime=finfo.st_atime;
350: rmtime=finfo.st_mtime;
351: rctime=finfo.st_ctime;
1.64 parser 352: return true;
1.18 paf 353: }
354:
/// Cuts the next row off the text at @a *row_ref, modifying the text in place.
/// The first @a delim is overwritten with 0 and @a *row_ref is moved past it;
/// when there is no @a delim, @a *row_ref becomes 0.
/// @return start of the row; 0 when @a *row_ref was 0,
///   or when no @a delim was found and the remaining text is empty
char *getrow(char **row_ref, char delim) {
	char *row=*row_ref;
	if(!row)
		return 0;

	char *delim_at=strchr(row, delim);
	if(delim_at) {
		*delim_at=0;
		*row_ref=delim_at+1;
		return row;
	}

	*row_ref=0;
	return *row?row:0;
}
366:
/// Splits @a string in place at the first @a delim, which is overwritten with 0.
/// @return the part after the delimiter; 0 when @a string is 0 or has no @a delim
char *lsplit(char *string, char delim) {
	if(!string)
		return 0;

	char *delim_at=strchr(string, delim);
	if(!delim_at)
		return 0;

	*delim_at=0;
	return delim_at+1;
}

/// Same split, iterator flavour: @a *string_ref is replaced with the part
/// after the delimiter [0 when there is none].
/// @return the original @a *string_ref, i.e. the part before the delimiter
char *lsplit(char **string_ref, char delim) {
	char *head=*string_ref;
	*string_ref=lsplit(head, delim);
	return head;
}
384:
/// Splits @a string in place at the last @a delim, which is overwritten with 0.
/// @return the part after the delimiter; NULL when @a string is 0 or has no @a delim
char *rsplit(char *string, char delim) {
	if(!string)
		return NULL;

	char *delim_at=strrchr(string, delim);
	if(!delim_at)
		return NULL;

	*delim_at=0;
	return delim_at+1;
}
395:
1.37 paf 396: /// @todo less stupid type detection
1.10 paf 397: char *format(Pool& pool, double value, char *fmt) {
1.78 paf 398: char *result=(char *)pool.malloc(MAX_NUMBER, 4);
1.10 paf 399: if(fmt)
400: if(strpbrk(fmt, "diouxX"))
401: if(strpbrk(fmt, "ouxX"))
1.33 paf 402: snprintf(result, MAX_NUMBER, fmt, (uint)value );
1.10 paf 403: else
1.33 paf 404: snprintf(result, MAX_NUMBER, fmt, (int)value );
1.10 paf 405: else
406: snprintf(result, MAX_NUMBER, fmt, value);
407: else
1.33 paf 408: snprintf(result, MAX_NUMBER, "%d", (int)value);
1.10 paf 409:
410: return result;
1.12 paf 411: }
412:
/// Writes @a size bytes from @a buf to stdout.
/// On WIN32 the data is written in chunks of at most 8K.
/// @return number of bytes actually written, on all platforms
///   [less than @a size when fwrite stopped early]
size_t stdout_write(const void *buf, size_t size) {
#ifdef WIN32
	const size_t max_chunk=8*0x400;
	const char *bytes=(const char*)buf;
	size_t total_written=0;
	while(total_written<size) {
		const size_t left=size-total_written;
		const size_t chunk_written=
			fwrite(bytes+total_written, 1, left<max_chunk?left:max_chunk, stdout);
		if(!chunk_written) // write problem: report what was written so far
			break;
		total_written+=chunk_written;
	}

	return total_written;
#else
	return fwrite(buf, 1, size, stdout);
#endif
}
1.14 paf 428:
1.77 parser 429: char *unescape_chars(Pool& pool, const char *cp, int len) {
1.78 paf 430: char *s=(char *)pool.malloc(len + 1, 5);
1.14 paf 431: enum EscapeState {
1.33 paf 432: EscapeRest,
433: EscapeFirst,
1.14 paf 434: EscapeSecond
435: } escapeState=EscapeRest;
436: int escapedValue=0;
437: int srcPos=0;
438: int dstPos=0;
439: while(srcPos < len) {
440: int ch=cp[srcPos];
441: switch(escapeState) {
442: case EscapeRest:
443: if(ch=='%') {
444: escapeState=EscapeFirst;
445: } else if(ch=='+') {
446: s[dstPos++]=' ';
447: } else {
448: s[dstPos++]=ch;
449: }
450: break;
451: case EscapeFirst:
452: escapedValue=hex_value[ch] << 4;
453: escapeState=EscapeSecond;
454: break;
455: case EscapeSecond:
456: escapedValue +=hex_value[ch];
457: s[dstPos++]=escapedValue;
458: escapeState=EscapeRest;
459: break;
460: }
461: srcPos++;
462: }
463: s[dstPos]=0;
464: return s;
465: }
466:
/// used by attributed_meaning_to_string / append_attribute_subattribute:
/// passed through Hash::for_each as the untyped 'info' argument
struct Attributed_meaning_info {
	String *header; // header line being constructed
	String::Untaint_lang lang; // language in which to append to that line
};
1.17 paf 472: static void append_attribute_subattribute(const Hash::Key& akey, Hash::Val *avalue,
1.14 paf 473: void *info) {
474: if(akey==VALUE_NAME)
475: return;
476:
1.40 paf 477: Attributed_meaning_info& ami=*static_cast<Attributed_meaning_info *>(info);
478:
1.14 paf 479: // ...; charset=windows1251
1.48 paf 480: *ami.header << "; ";
1.70 parser 481: ami.header->append(akey, ami.lang);
1.48 paf 482: *ami.header << "=";
1.70 parser 483: ami.header->append(static_cast<Value *>(avalue)->as_string(), ami.lang);
1.14 paf 484: }
1.49 paf 485: const String& attributed_meaning_to_string(Value& meaning,
486: String::Untaint_lang lang) {
1.20 paf 487: String &result=*new(meaning.pool()) String(meaning.pool());
1.75 parser 488: if(Hash *hash=meaning.get_hash(0)) {
1.14 paf 489: // $value(value) $subattribute(subattribute value)
490: if(Value *value=static_cast<Value *>(hash->get(*value_name)))
1.40 paf 491: result.append(value->as_string(), lang, true);
1.14 paf 492:
1.40 paf 493: Attributed_meaning_info attributed_meaning_info={
1.52 paf 494: &result,
495: lang
1.40 paf 496: };
497: hash->for_each(append_attribute_subattribute, &attributed_meaning_info);
1.14 paf 498: } else // result value
1.40 paf 499: result.append(meaning.as_string(), lang, true);
1.14 paf 500:
501: return result;
1.24 paf 502: }
503:
504: #ifdef WIN32
/// Replaces every '\\' in the zero-terminated string @a s with '/', in place.
/// A null @a s is allowed and ignored.
void back_slashes_to_slashes(char *s) {
	if(!s)
		return;

	while(*s) {
		if(*s=='\\')
			*s='/';
		++s;
	}
}
1.42 paf 511: /*
512: void slashes_to_back_slashes(char *s) {
513: if(s)
514: for(; *s; s++)
515: if(*s=='/')
516: *s='\\';
517: }
518: */
1.24 paf 519: #endif
1.41 paf 520:
/**
	Compares two zero-terminated strings ignoring the case of letters.

	@param strict true: the strings must be equal in full;
		false: it is enough that one string is a prefix of the other
	@return true when the strings are considered equal

	Characters are handed to isalpha/tolower as unsigned char values:
	those functions are not defined for negative arguments,
	which plain char gives for bytes above 0x7F.
*/
bool StrEqNc(const char *s1, const char *s2, bool strict) {
	for(; ; s1++, s2++) {
		const unsigned char c1=(unsigned char)*s1;
		const unsigned char c2=(unsigned char)*s2;

		if(!c1 || !c2) // at least one string is over
			return (!c1 && !c2) || !strict;

		if(isalpha(c1)) {
			if(tolower(c1)!=tolower(c2))
				return false;
		} else if(c1!=c2)
			return false;
	}
}
539:
/// @return true when @a year is divisible by 4, except for
///   the years divisible by 100 but not by 400
static bool isLeap(int year) {
	if(year % 4)
		return false;

	return (year % 100)!=0 || (year % 400)==0;
}

/// Number of days in a month.
/// @param year used to decide the length of February [see isLeap]
/// @param month zero-based: 0 is the 31-day first month, 1 is February, ..., 11 the last
/// @return days in that month; 0 when @a month is outside 0..11
int getMonthDays(int year, int month) {
	static const int regularMonthDays[]={
		31, 28, 31, 30, 31, 30,
		31, 31, 30, 31, 30, 31
	};
	const int monthCount=sizeof(regularMonthDays)/sizeof(regularMonthDays[0]);

	// never read outside of the table
	if(month<0 || month>=monthCount)
		return 0;

	if(month==1 && isLeap(year))
		return 29;
	return regularMonthDays[month];
}
1.69 parser 563:
/// Makes the text in [@a start, @a end) a single line, in place:
/// every '\n' is replaced with '|', every '\r' with a space.
void remove_crlf(char *start, char *end) {
	for(char *cursor=start; cursor<end; ++cursor) {
		if(*cursor=='\n')
			*cursor='|';
		else if(*cursor=='\r')
			*cursor=' ';
	}
}
571:
572:
573: /// must be last in this file
#undef vsnprintf
/**
	vsnprintf with uniform behaviour on all platforms.

	@param b buffer to print to
	@param s full size of @a b in bytes, room for the terminating zero included
	@param f printf-style format
	@param l arguments for @a f
	@return number of characters stored in @a b, terminating zero not counted:
		never more than s-1; 0 when @a s is 0 [then @a b is not touched]

	The result is always zero-terminated, a too long output is cut to s-1 characters.
*/
int __vsnprintf(char *b, size_t s, const char *f, va_list l) {
	if(!s)
		return 0;

	// that many characters fit in, leaving room for the terminating zero
	const size_t max_chars=s-1;
	int r;
#if _MSC_VER
	/*
	win32:
	_vsnprintf does not write the terminating 0 in 'buffer full' case,
	so it is given the size reduced by one and the 0 is stored below.

	if the number of bytes to write exceeds buffer,
	then count bytes are written and -1 is returned
	*/
	r=_vsnprintf(b, max_chars, f, l);
	if(r<0)
		r=(int)max_chars;
#else
	/*
	vsnprintf here takes the full buffer size: it counts the terminating 0 in
	[passing the reduced size would lose the last character that fits].

	solaris:
	man vsnprintf

	The snprintf() function returns the number of characters
	formatted, that is, the number of characters that would have
	been written to the buffer if it were large enough. If the
	value of n is 0 on a call to snprintf(), an unspecified
	value less than 1 is returned.
	*/
	r=vsnprintf(b, s, f, l);
	if(r<0)
		r=0;
	else if((size_t)r>max_chars)
		r=(int)max_chars;
#endif
	// in any case: terminate right after the characters reported
	b[r]=0;
	return r;
}

/// snprintf flavour of __vsnprintf: same parameters, result and guarantees,
/// the arguments for @a f are taken from the ellipsis.
int __snprintf(char *b, size_t s, const char *f, ...) {
	va_list l;
	va_start(l, f);
	const int r=__vsnprintf(b, s, f, l);
	va_end(l);
	return r;
}
E-mail: