Annotation of parser3/src/main/pa_common.C, revision 1.98
1.15 paf 1: /** @file
1.16 paf 2: Parser: commonly used functions.
3:
1.8 paf 4: Copyright(c) 2001 ArtLebedev Group(http://www.artlebedev.com)
1.85 paf 5: Author: Alexander Petrosyan <paf@design.ru>(http://paf.design.ru)
1.16 paf 6:
1.98 ! paf 7: $Id: pa_common.C,v 1.97 2002/02/05 09:32:43 paf Exp $
1.1 paf 8: */
9:
10: #include "pa_common.h"
1.2 paf 11: #include "pa_types.h"
1.4 paf 12: #include "pa_exception.h"
1.14 paf 13: #include "pa_pool.h"
14: #include "pa_globals.h"
15: #include "pa_value.h"
16: #include "pa_hash.h"
17: #include "pa_string.h"
1.1 paf 18:
1.98 ! paf 19: #ifdef WIN32
! 20: # include <windows.h>
! 21: #endif
! 22:
// Fallbacks for open() flags that may be missing on the current platform.
// A missing flag is defined as 0 so that OR-ing it into a mode is a no-op.

#if !defined(_O_TEXT)
#	define _O_TEXT 0
#endif
#if !defined(_O_BINARY)
#	define _O_BINARY 0
#endif
#if !defined(O_TRUNC)
#	define O_TRUNC 0
#endif
34:
// locking constants

// TEST_LOCK_EX: operation code for a non-blocking attempt to take an exclusive lock
#if defined(_LK_NBLCK)
// win32
#	define TEST_LOCK_EX _LK_NBLCK
#elif defined(LOCK_EX) && defined(LOCK_NB)
// flock(): both flags must be combined bitwise;
// a logical OR would collapse them to the value 1
#	define TEST_LOCK_EX (LOCK_EX | LOCK_NB)
#elif defined(F_TLOCK)
// sun
#	define TEST_LOCK_EX F_TLOCK
#else
#	error unable to define TEST_LOCK_EX
#endif
! 53:
// LOCK_EX: exclusive lock operation code
#if !defined(LOCK_EX)
#	if defined(_LK_LOCK)
// win32
#		define LOCK_EX _LK_LOCK
#	elif defined(F_LOCK)
// sun
#		define LOCK_EX F_LOCK
#	else
#		error unable to define LOCK_EX
#	endif
#endif

// LOCK_SH: shared lock operation code
#if !defined(LOCK_SH)
#	if defined(_LK_RLCK)
// win32
#		define LOCK_SH _LK_RLCK
#	elif defined(F_LOCK)
// sun
/// @todo shared lock bit. forgot where to get those F_LOCK consts group
#		define LOCK_SH F_LOCK
#	else
#		error unable to define LOCK_SH
#	endif
#endif

// LOCK_UN: unlock operation code
#if !defined(LOCK_UN)
#	if defined(_LK_UNLCK)
// win32
#		define LOCK_UN _LK_UNLCK
#	elif defined(F_ULOCK)
// sun
#		define LOCK_UN F_ULOCK
#	else
#		error unable to define LOCK_UN
#	endif
#endif
96:
97: #ifndef HAVE_FLOCK
1.98 ! paf 98: static int flock(int fd, int operation) {
! 99: lseek(fd, 0, SEEK_SET);
1.93 paf 100: // win32
101: #ifdef HAVE__LOCKING
1.98 ! paf 102: int result=_locking(fd, operation, 1);
1.93 paf 103: #else
104: // sun
105: #ifdef HAVE_LOCKF
1.98 ! paf 106: int result=lockf(fd, operation, 1);
1.93 paf 107: #else
1.98 ! paf 108: # error unable to find locking func
1.93 paf 109: #endif
110: #endif
1.98 ! paf 111: lseek(fd, 0, SEEK_SET);
! 112: return result;
! 113: }
1.93 paf 114: #endif
115:
/// Finds the first byte equal to @a c among the first @a size bytes of @a buf.
/// Unlike strchr, a zero byte does not stop the search.
/// @return pointer to the match, or 0 when there is none
static char *strnchr(char *buf, size_t size, char c) {
	return static_cast<char *>(memchr(buf, c, size));
}

/**
	Converts line breaks to '\n' in place.

	- DOS: "\r\n" becomes "\n", @a size is decreased by one for each pair
	- Macintosh: a lone "\r" becomes "\n", @a size is unchanged

	@param buf data to fix, @a size bytes long, need not be zero-terminated
	@param size in: length of data; out: length after fixing

	No terminating zero is written: the caller adds one if needed.
*/
void fix_line_breaks(char *buf, size_t& size) {
	const char * const eob=buf+size;
	char *dest=buf; // where the next fixed byte goes, never ahead of bol
	char *bol=buf; // start of the not yet processed part
	while(char *eol=strnchr(bol, eob-bol, '\r')) {
		size_t len=eol-bol;
		// source and destination may overlap once a "\r\n" pair was collapsed,
		// so memmove is required here
		if(dest!=bol)
			memmove(dest, bol, len);
		dest+=len;
		*dest++='\n';

		if(eol+1<eob && eol[1]=='\n') { // \r,\n = DOS
			bol=eol+2;
			size--;
		} else // \r,not \n = Macintosh
			bol=eol+1;
	}
	// last piece without \r
	if(dest!=bol)
		memmove(dest, bol, eob-bol);
}
1.18 paf 149:
1.28 paf 150: char *file_read_text(Pool& pool, const String& file_spec, bool fail_on_read_problem) {
1.72 parser 151: void *result; size_t size;
152: return file_read(pool, file_spec, result, size, true, fail_on_read_problem)?(char *)result:0;
1.34 paf 153: }
154: bool file_read(Pool& pool, const String& file_spec,
1.87 paf 155: void*& data, size_t& data_size, bool as_text,
1.44 paf 156: bool fail_on_read_problem,
157: size_t offset, size_t limit) {
1.64 parser 158: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.62 parser 159: //printf("file_read(%s)\n", fname);
1.33 paf 160: int f;
1.2 paf 161: struct stat finfo;
1.33 paf 162:
163: // first open, next stat:
1.45 paf 164: // directory update of NTFS hard links performed on open.
1.33 paf 165: // ex:
166: // a.html:^test[] and b.html hardlink to a.html
167: // user inserts ! before ^test in a.html
168: // directory entry of b.html in NTFS not updated at once,
1.35 paf 169: // they delay update till open, so we would receive "!^test[" string
170: // if would do stat, next open.
1.98 ! paf 171: if((f=open(fname, O_RDONLY|(as_text?_O_TEXT:_O_BINARY)))>=0) {
1.93 paf 172: flock(f, LOCK_SH);
1.98 ! paf 173: if(stat(fname, &finfo)!=0) {
! 174: Exception e(0, 0,
! 175: &file_spec,
! 176: "stat failed: %s (%d), actual filename '%s'",
! 177: strerror(errno), errno, fname);
! 178: flock(f, LOCK_UN);
! 179: close(f);
! 180: if(fail_on_read_problem)
! 181: throw e;
! 182: return false;
! 183: }
! 184: size_t max_size=limit?min(offset+limit, (size_t)finfo.st_size)-offset:finfo.st_size;
1.47 paf 185: if(!max_size) { // eof
1.83 paf 186: if(as_text) {
187: data=pool.malloc(1);
188: *(char*)data=0;
189: } else
190: data=0;
1.98 ! paf 191: data_size=0;
1.59 parser 192: } else {
1.78 paf 193: data=pool.malloc(max_size+(as_text?1:0), 3);
1.59 parser 194: if(offset)
195: lseek(f, offset, SEEK_SET);
1.98 ! paf 196: data_size=read(f, data, max_size);
1.47 paf 197: }
1.93 paf 198: flock(f, LOCK_UN);
1.2 paf 199: close(f);
1.59 parser 200: if(!max_size) // eof
201: return true;
1.32 paf 202:
1.98 ! paf 203: if(int(data_size)<0 || data_size>max_size)
1.73 parser 204: throw Exception(0, 0,
1.33 paf 205: &file_spec,
1.44 paf 206: "read failed: actually read %d bytes count not in [0..%lu] valid range",
1.98 ! paf 207: data_size, (unsigned long)max_size); //never
1.87 paf 208:
209: if(as_text) {
210: fix_line_breaks((char *)data, data_size);
211: // note: after fixing
212: ((char*&)data)[data_size]=0;
213: }
1.72 parser 214: return true;
1.2 paf 215: }
1.4 paf 216: if(fail_on_read_problem)
1.73 parser 217: throw Exception(0, 0,
1.33 paf 218: &file_spec,
1.54 parser 219: "read failed: %s (%d), actual filename '%s'",
220: strerror(errno), errno, fname);
1.34 paf 221: return false;
1.8 paf 222: }
223:
1.63 parser 224: static void create_dir_for_file(const String& file_spec) {
225: size_t pos_after=1;
226: int pos_before;
227: while((pos_before=file_spec.pos("/", 1, pos_after))>=0) {
1.64 parser 228: mkdir(file_spec.mid(0, pos_before).cstr(String::UL_FILE_SPEC), 0775);
1.63 parser 229: pos_after=pos_before+1;
230: }
231: }
232:
1.98 ! paf 233: bool file_write_action_under_lock(
1.28 paf 234: const String& file_spec,
1.96 paf 235: const char *action_name, void (*action)(int, void *), void *context,
1.80 paf 236: bool as_text,
1.98 ! paf 237: bool do_append,
! 238: bool do_block) {
1.64 parser 239: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.28 paf 240: int f;
1.80 paf 241: if(access(fname, W_OK)!=0) // no
1.63 parser 242: create_dir_for_file(file_spec);
1.50 paf 243:
1.80 paf 244: if((f=open(fname,
245: O_CREAT|O_RDWR
246: |(as_text?_O_TEXT:_O_BINARY)
1.98 ! paf 247: |(do_append?O_APPEND:0), 0664))>=0) {
! 248: if(flock(f, do_block?LOCK_EX:TEST_LOCK_EX)!=0) {
! 249: close(f);
! 250: return false;
! 251: }
1.96 paf 252:
253: try {
254: action(f, context);
255: } catch(...) {
1.98 ! paf 256: #if O_TRUNC==0
! 257: ftruncate(f, tell(f));
! 258: #endif
1.96 paf 259: flock(f, LOCK_UN);
260: close(f);
261: /*re*/throw;
262: }
1.80 paf 263:
1.98 ! paf 264: #if O_TRUNC==0
! 265: ftruncate(f, tell(f));
! 266: #endif
1.93 paf 267: flock(f, LOCK_UN);
1.80 paf 268: close(f);
1.98 ! paf 269: return true;
1.80 paf 270: } else
271: throw Exception(0, 0,
272: &file_spec,
1.96 paf 273: "%s failed: %s (%d), actual filename '%s'",
274: action_name, strerror(errno), errno, fname);
275: // here should be nothing, see rethrow above
276: }
277:
#ifndef DOXYGEN
/// context handed to file_write_action: the bytes to write
struct File_write_action_info {
	const void *data; size_t size;
};
#endif
/// Writes the bytes described by @a context (a File_write_action_info) to @a f.
/// Nothing is written when the size is 0; the result of write() is not checked.
static void file_write_action(int f, void *context) {
	const File_write_action_info *request=static_cast<File_write_action_info *>(context);
	if(request->size==0)
		return;
	write(f, request->data, request->size);
}
288: void file_write(
289: const String& file_spec,
290: const void *data, size_t size,
291: bool as_text,
292: bool do_append) {
293: File_write_action_info info={data, size};
1.98 ! paf 294: file_write_action_under_lock(
1.96 paf 295: file_spec,
296: "write", file_write_action, &info,
297: as_text,
298: do_append);
1.30 paf 299: }
300:
1.63 parser 301: // throws nothing! [this is required in file_move & file_delete]
1.50 paf 302: static void rmdir(const String& file_spec, size_t pos_after) {
303: int pos_before;
304: if((pos_before=file_spec.pos("/", 1, pos_after))>=0)
305: rmdir(file_spec, pos_before+1);
306:
1.64 parser 307: rmdir(file_spec.mid(0, pos_after-1/* / */).cstr(String::UL_FILE_SPEC));
1.50 paf 308: }
1.95 paf 309: bool file_delete(const String& file_spec, bool fail_on_read_problem) {
1.64 parser 310: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.54 parser 311: if(unlink(fname)!=0)
1.93 paf 312: if(fail_on_read_problem)
313: throw Exception(0, 0,
314: &file_spec,
315: "unlink failed: %s (%d), actual filename '%s'",
316: strerror(errno), errno, fname);
317: else
318: return false;
1.50 paf 319:
320: rmdir(file_spec, 1);
1.93 paf 321: return true;
1.60 parser 322: }
1.95 paf 323: void file_move(const String& old_spec, const String& new_spec) {
1.64 parser 324: const char *old_spec_cstr=old_spec.cstr(String::UL_FILE_SPEC);
325: const char *new_spec_cstr=new_spec.cstr(String::UL_FILE_SPEC);
1.63 parser 326:
327: create_dir_for_file(new_spec);
328:
1.60 parser 329: if(rename(old_spec_cstr, new_spec_cstr)!=0)
1.73 parser 330: throw Exception(0, 0,
1.60 parser 331: &old_spec,
332: "rename failed: %s (%d), actual filename '%s' to '%s'",
333: strerror(errno), errno, old_spec_cstr, new_spec_cstr);
1.63 parser 334:
335: rmdir(old_spec, 1);
1.31 paf 336: }
337:
1.51 paf 338:
339: static bool entry_readable(const String& file_spec, bool need_dir) {
1.64 parser 340: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.51 paf 341: struct stat finfo;
342: if(access(fname, R_OK)==0 && stat(fname, &finfo)==0) {
1.73 parser 343: bool is_dir=finfo.st_mode&S_IFDIR != 0;
1.51 paf 344: return is_dir==need_dir;
345: }
346: return false;
347: }
1.31 paf 348: bool file_readable(const String& file_spec) {
1.51 paf 349: return entry_readable(file_spec, false);
350: }
351: bool dir_readable(const String& file_spec) {
352: return entry_readable(file_spec, true);
1.65 parser 353: }
354: String *file_readable(const String& path, const String& name) {
355: String *result=new(path.pool()) String(path);
356: *result << "/";
357: *result << name;
358: return file_readable(*result)?result:0;
1.43 paf 359: }
360: bool file_executable(const String& file_spec) {
1.64 parser 361: return access(file_spec.cstr(String::UL_FILE_SPEC), X_OK)==0;
1.44 paf 362: }
363:
1.64 parser 364: bool file_stat(const String& file_spec,
1.58 parser 365: size_t& rsize,
366: time_t& ratime,
367: time_t& rmtime,
1.64 parser 368: time_t& rctime,
369: bool fail_on_read_problem) {
1.44 paf 370: Pool& pool=file_spec.pool();
1.64 parser 371: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.44 paf 372: struct stat finfo;
373: if(stat(fname, &finfo)!=0)
1.64 parser 374: if(fail_on_read_problem)
1.73 parser 375: throw Exception(0, 0,
1.67 parser 376: &file_spec,
377: "getting file size failed: %s (%d), real filename '%s'",
378: strerror(errno), errno, fname);
1.64 parser 379: else
380: return false;
1.58 parser 381: rsize=finfo.st_size;
382: ratime=finfo.st_atime;
383: rmtime=finfo.st_mtime;
384: rctime=finfo.st_ctime;
1.64 parser 385: return true;
1.18 paf 386: }
387:
/**
	Cuts the next row off a zero-terminated buffer, modifying it in place.

	@param row_ref in: start of the remaining text (may be 0);
		out: text after the delimiter, or 0 when no delimiter was found
	@param delim row delimiter, replaced by 0 in the buffer
	@return the row; 0 when *row_ref was 0 or when the remaining text was empty
*/
char *getrow(char **row_ref, char delim) {
	char *row=*row_ref;
	if(!row)
		return row;

	char *cut=strchr(row, delim);
	if(cut) {
		*cut=0;
		*row_ref=cut+1;
		return row;
	}

	// no delimiter: this is the last row, unless nothing is left at all
	*row_ref=0;
	return *row?row:0;
}
399:
/// Splits @a string at the first @a delim, replacing it by 0.
/// @return pointer to the text after the delimiter;
///	0 when @a string is 0 or contains no delimiter
char *lsplit(char *string, char delim) {
	if(!string)
		return 0;

	char *hit=strchr(string, delim);
	if(!hit)
		return 0;

	*hit=0;
	return hit+1;
}
410:
/// Cuts the piece before the first @a delim off *string_ref.
/// @param string_ref in: text to split (may be 0);
///	out: text after the delimiter, or 0 when there was no delimiter
/// @return the original value of *string_ref
char *lsplit(char **string_ref, char delim) {
	char *head=*string_ref;
	char *tail=0;
	if(head) {
		char *hit=strchr(head, delim);
		if(hit) {
			*hit=0;
			tail=hit+1;
		}
	}
	*string_ref=tail;
	return head;
}
417:
/// Splits @a string at the last @a delim, replacing it by 0.
/// @return pointer to the text after the delimiter;
///	NULL when @a string is 0 or contains no delimiter
char *rsplit(char *string, char delim) {
	char *hit=string?strrchr(string, delim):NULL;
	if(!hit)
		return NULL;

	*hit=0;
	return hit+1;
}
428:
1.37 paf 429: /// @todo less stupid type detection
1.10 paf 430: char *format(Pool& pool, double value, char *fmt) {
1.78 paf 431: char *result=(char *)pool.malloc(MAX_NUMBER, 4);
1.10 paf 432: if(fmt)
433: if(strpbrk(fmt, "diouxX"))
434: if(strpbrk(fmt, "ouxX"))
1.33 paf 435: snprintf(result, MAX_NUMBER, fmt, (uint)value );
1.10 paf 436: else
1.33 paf 437: snprintf(result, MAX_NUMBER, fmt, (int)value );
1.10 paf 438: else
439: snprintf(result, MAX_NUMBER, fmt, value);
440: else
1.33 paf 441: snprintf(result, MAX_NUMBER, "%d", (int)value);
1.10 paf 442:
443: return result;
1.12 paf 444: }
445:
/**
	Writes @a size bytes from @a buf to stdout.

	On WIN32 the data is written in chunks of at most 8K.
	@return number of bytes actually written
*/
size_t stdout_write(const void *buf, size_t size) {
#ifdef WIN32
	const size_t max_chunk=8*0x400;
	const char *bytes=static_cast<const char *>(buf);
	size_t written=0;
	while(written<size) {
		const size_t rest=size-written;
		const size_t chunk=fwrite(bytes+written, 1, rest<max_chunk?rest:max_chunk, stdout);
		if(chunk==0) // stdout refused to take more
			break;
		written+=chunk;
	}

	// report what was written, same as the other branch does
	return written;
#else
	return fwrite(buf, 1, size, stdout);
#endif
}
1.14 paf 461:
1.77 parser 462: char *unescape_chars(Pool& pool, const char *cp, int len) {
1.78 paf 463: char *s=(char *)pool.malloc(len + 1, 5);
1.14 paf 464: enum EscapeState {
1.33 paf 465: EscapeRest,
466: EscapeFirst,
1.14 paf 467: EscapeSecond
468: } escapeState=EscapeRest;
469: int escapedValue=0;
470: int srcPos=0;
471: int dstPos=0;
472: while(srcPos < len) {
473: int ch=cp[srcPos];
474: switch(escapeState) {
475: case EscapeRest:
476: if(ch=='%') {
477: escapeState=EscapeFirst;
478: } else if(ch=='+') {
479: s[dstPos++]=' ';
480: } else {
481: s[dstPos++]=ch;
482: }
483: break;
484: case EscapeFirst:
485: escapedValue=hex_value[ch] << 4;
486: escapeState=EscapeSecond;
487: break;
488: case EscapeSecond:
489: escapedValue +=hex_value[ch];
490: s[dstPos++]=escapedValue;
491: escapeState=EscapeRest;
492: break;
493: }
494: srcPos++;
495: }
496: s[dstPos]=0;
497: return s;
498: }
499:
1.52 paf 500: /// used by attributed_meaning_to_string / append_attribute_subattribute
1.40 paf 501: struct Attributed_meaning_info {
1.52 paf 502: String *header; // header line being constructed
503: String::Untaint_lang lang; // language in which to append to that line
1.40 paf 504: };
1.17 paf 505: static void append_attribute_subattribute(const Hash::Key& akey, Hash::Val *avalue,
1.14 paf 506: void *info) {
507: if(akey==VALUE_NAME)
508: return;
509:
1.40 paf 510: Attributed_meaning_info& ami=*static_cast<Attributed_meaning_info *>(info);
511:
1.14 paf 512: // ...; charset=windows1251
1.48 paf 513: *ami.header << "; ";
1.70 parser 514: ami.header->append(akey, ami.lang);
1.48 paf 515: *ami.header << "=";
1.70 parser 516: ami.header->append(static_cast<Value *>(avalue)->as_string(), ami.lang);
1.14 paf 517: }
1.49 paf 518: const String& attributed_meaning_to_string(Value& meaning,
519: String::Untaint_lang lang) {
1.20 paf 520: String &result=*new(meaning.pool()) String(meaning.pool());
1.75 parser 521: if(Hash *hash=meaning.get_hash(0)) {
1.14 paf 522: // $value(value) $subattribute(subattribute value)
523: if(Value *value=static_cast<Value *>(hash->get(*value_name)))
1.40 paf 524: result.append(value->as_string(), lang, true);
1.14 paf 525:
1.40 paf 526: Attributed_meaning_info attributed_meaning_info={
1.52 paf 527: &result,
528: lang
1.40 paf 529: };
530: hash->for_each(append_attribute_subattribute, &attributed_meaning_info);
1.14 paf 531: } else // result value
1.40 paf 532: result.append(meaning.as_string(), lang, true);
1.14 paf 533:
534: return result;
1.24 paf 535: }
536:
537: #ifdef WIN32
/// Replaces every '\\' by '/' in the zero-terminated string @a s, in place.
/// Does nothing when @a s is 0.
void back_slashes_to_slashes(char *s) {
	if(!s)
		return;

	while(*s) {
		if(*s=='\\')
			*s='/';
		++s;
	}
}
1.42 paf 544: /*
545: void slashes_to_back_slashes(char *s) {
546: if(s)
547: for(; *s; s++)
548: if(*s=='/')
549: *s='\\';
550: }
551: */
1.24 paf 552: #endif
1.41 paf 553:
/**
	Compares two zero-terminated strings ignoring the case of letters.

	@param strict when true the strings must have equal length;
		when false it is enough that one string is a prefix of the other
	@return true when the strings are considered equal
*/
bool StrEqNc(const char *s1, const char *s2, bool strict) {
	for(;; s1++, s2++) {
		// <ctype.h> functions require values of unsigned char range
		const unsigned char c1=(unsigned char)*s1;
		const unsigned char c2=(unsigned char)*s2;

		if(!c1 || !c2) // at least one string ended
			return (!c1 && !c2) || !strict;

		if(isalpha(c1)) {
			if(tolower(c1)!=tolower(c2))
				return false;
		} else if(c1!=c2)
			return false;
	}
}
572:
/// @return true when @a year is divisible by 4 and is either
///	not divisible by 100 or divisible by 400
static bool isLeap(int year) {
	if(year % 4)
		return false;
	return (year % 100)!=0 || (year % 400)==0;
}

/// @param year year, decides the length of February
/// @param month zero-based month number: 0 is January, 11 is December (not range-checked)
/// @return number of days in that month
int getMonthDays(int year, int month) {
	static const int commonYearDays[]={
		31, 28, 31, 30, 31, 30, 
		31, 31, 30, 31, 30, 31
	};
	const int february=1;
	if(month==february && isLeap(year))
		return 29;
	return commonYearDays[month];
}
1.69 parser 596:
/// Replaces line break characters in the range [start, end), in place:
/// '\n' becomes '|', '\r' becomes ' '.
void remove_crlf(char *start, char *end) {
	char *p=start;
	while(p<end) {
		if(*p=='\n')
			*p='|';
		else if(*p=='\r')
			*p=' ';
		++p;
	}
}
604:
605:
606: /// must be last in this file
607: #undef vsnprintf
/**
	vsnprintf with uniform behaviour across platforms.

	The result is always zero-terminated when @a s is not 0.
	@param b buffer to print to
	@param s size of the buffer, including the place for terminating 0
	@param f printf-style format
	@param l arguments for @a f
	@return number of characters stored in @a b, not counting terminating 0
		(at most s-1); 0 when @a s is 0 or formatting failed
*/
int __vsnprintf(char *b, size_t s, const char *f, va_list l) {
	if(!s)
		return 0;

	// maximum number of characters, leaving the place for terminating 0
	const size_t room=s-1;
	int r;
#if _MSC_VER
	// win32: _vsnprintf does not write terminating 0 in 'buffer full' case,
	// so it is only offered the reduced size;
	// if the number of bytes to write exceeds that, -1 is returned
	r=_vsnprintf(b, room, f, l);
	if(r<0)
		r=(int)room;
#else
	// vsnprintf counts terminating 0 within the size it is given,
	// so it gets the whole buffer; offering it s-1 would lose the last character.
	// It returns the number of characters that would have been written
	// if the buffer were large enough
	r=vsnprintf(b, s, f, l);
	if(r<0)
		r=0;
	else if((size_t)r>room)
		r=(int)room;
#endif
	b[r]=0;
	return r;
}

/// Variadic front end of __vsnprintf, see there for parameters and result.
int __snprintf(char *b, size_t s, const char *f, ...) {
	va_list l;
	va_start(l, f); 
	int r=__vsnprintf(b, s, f, l); 
	va_end(l); 
	return r;
}
! 655:
/**
	Suspends execution for @a secs seconds plus @a usecs microseconds.

	@return on WIN32 always 0; elsewhere 0 when select() succeeded,
		errno when it returned -1
*/
int pa_sleep(unsigned long secs, unsigned long usecs) {
	// move whole seconds out of the microseconds part
	secs+=usecs/1000000;
	usecs%=1000000;

#ifdef WIN32
	Sleep(secs * 1000 + usecs / 1000);
	return 0;
#else
	struct timeval t;
	t.tv_sec = secs;
	t.tv_usec = usecs;
	if(select(0, NULL, NULL, NULL, &t) == -1)
		return errno;
	return 0;
#endif
}
E-mail: