Annotation of parser3/src/main/pa_common.C, revision 1.78
1.15 paf 1: /** @file
1.16 paf 2: Parser: commonly used functions.
3:
1.8 paf 4: Copyright(c) 2001 ArtLebedev Group(http://www.artlebedev.com)
1.68 parser 5: Author: Alexander Petrosyan <paf@design.ru>(http://design.ru/paf)
1.16 paf 6:
1.78 ! paf 7: $Id: pa_common.C,v 1.77 2001/10/24 16:33:02 parser Exp $
1.1 paf 8: */
9:
10: #include "pa_common.h"
1.2 paf 11: #include "pa_types.h"
1.4 paf 12: #include "pa_exception.h"
1.14 paf 13: #include "pa_pool.h"
14: #include "pa_globals.h"
15: #include "pa_value.h"
16: #include "pa_hash.h"
17: #include "pa_string.h"
1.1 paf 18:
1.47 paf 19: #ifndef WIN32
20: # ifndef _O_TEXT
21: # define _O_TEXT 0
22: # endif
23: # ifndef _O_BINARY
24: # define _O_BINARY 0
25: # endif
26: #endif
27:
1.22 paf 28: #if _MSC_VER
1.1 paf 29:
30: int __vsnprintf(char *b, size_t s, const char *f, va_list l) {
31: int r=_vsnprintf(b, --s, f, l);
32: b[s]=0;
33: return r;
34: }
35: int __snprintf(char *b, size_t s, const char *f, ...) {
36: va_list l;
37: va_start(l, f);
38: int r=__vsnprintf(b, s, f, l);
39: va_end(l);
40: return r;
41: }
42:
43: #endif
1.2 paf 44:
/**
	Normalizes line breaks of a NUL-terminated buffer in place.

	- DOS: "\r\n" becomes "\n" (and @a size is decremented by one)
	- Macintosh: lone "\r" becomes "\n" (@a size is unchanged)

	@param src NUL-terminated text, rewritten in place; processing stops
		at the first 0 byte
	@param size length of the text; reduced by one for every "\r\n" pair
*/
void fix_line_breaks(char *src, size_t& size) {
	char *dest=src; // where the next normalized piece goes
	char *bol=src; // beginning of the not yet processed piece

	while(char *eol=strchr(bol, '\r')) {
		size_t len=eol-bol;
		// source and destination may overlap once something was removed,
		// so memmove is required here [memcpy on overlap is undefined]
		if(dest!=bol)
			memmove(dest, bol, len);
		dest+=len;
		*dest++='\n';

		if(eol[1]=='\n') { // \r,\n = DOS
			bol=eol+2;
			size--;
		} else // \r,not \n = Macintosh
			bol=eol+1;
	}

	// last piece without \r, including terminating 0
	// [overlapping again: memmove, not strcpy]
	if(dest!=bol)
		memmove(dest, bol, strlen(bol)+1);
}
1.18 paf 67:
1.28 paf 68: char *file_read_text(Pool& pool, const String& file_spec, bool fail_on_read_problem) {
1.72 parser 69: void *result; size_t size;
70: return file_read(pool, file_spec, result, size, true, fail_on_read_problem)?(char *)result:0;
1.34 paf 71: }
72: bool file_read(Pool& pool, const String& file_spec,
1.44 paf 73: void*& data, size_t& read_size, bool as_text,
74: bool fail_on_read_problem,
75: size_t offset, size_t limit) {
1.64 parser 76: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.62 parser 77: //printf("file_read(%s)\n", fname);
1.33 paf 78: int f;
1.2 paf 79: struct stat finfo;
1.33 paf 80:
81: // first open, next stat:
1.45 paf 82: // directory update of NTFS hard links performed on open.
1.33 paf 83: // ex:
84: // a.html:^test[] and b.html hardlink to a.html
85: // user inserts ! before ^test in a.html
86: // directory entry of b.html in NTFS not updated at once,
1.35 paf 87: // they delay update till open, so we would receive "!^test[" string
88: // if would do stat, next open.
1.34 paf 89: if(
1.72 parser 90: (f=open(fname, O_RDONLY|(as_text?_O_BINARY/*_O_TEXT*/:_O_BINARY)))>=0 &&
1.34 paf 91: stat(fname, &finfo)==0) {
1.2 paf 92: /*if(exclusive)
93: flock(f, LOCK_EX);*/
1.44 paf 94: size_t max_size=limit?min(offset+limit, finfo.st_size)-offset:finfo.st_size;
1.47 paf 95: if(!max_size) { // eof
96: data=0;
97: read_size=0;
1.59 parser 98: } else {
1.78 ! paf 99: data=pool.malloc(max_size+(as_text?1:0), 3);
1.59 parser 100: if(offset)
101: lseek(f, offset, SEEK_SET);
102: read_size=read(f, data, max_size);
1.47 paf 103: }
1.2 paf 104: /*if(exclusive)
105: flock(f, LOCK_UN);*/
106: close(f);
1.59 parser 107: if(!max_size) // eof
108: return true;
1.32 paf 109:
1.44 paf 110: if(read_size>=0 && read_size<=max_size) {
1.34 paf 111: if(as_text)
1.46 paf 112: ((char*&)data)[read_size]=0;
1.34 paf 113: } else
1.73 parser 114: throw Exception(0, 0,
1.33 paf 115: &file_spec,
1.44 paf 116: "read failed: actually read %d bytes count not in [0..%lu] valid range",
117: read_size, (unsigned long)max_size); //never
1.32 paf 118:
1.72 parser 119: if(as_text)
120: fix_line_breaks((char *)data, read_size);
121: return true;
1.2 paf 122: }
1.4 paf 123: if(fail_on_read_problem)
1.73 parser 124: throw Exception(0, 0,
1.33 paf 125: &file_spec,
1.54 parser 126: "read failed: %s (%d), actual filename '%s'",
127: strerror(errno), errno, fname);
1.34 paf 128: return false;
1.8 paf 129: }
130:
1.63 parser 131: static void create_dir_for_file(const String& file_spec) {
132: size_t pos_after=1;
133: int pos_before;
134: while((pos_before=file_spec.pos("/", 1, pos_after))>=0) {
1.64 parser 135: mkdir(file_spec.mid(0, pos_before).cstr(String::UL_FILE_SPEC), 0775);
1.63 parser 136: pos_after=pos_before+1;
137: }
138: }
139:
1.18 paf 140: void file_write(Pool& pool,
1.28 paf 141: const String& file_spec,
1.34 paf 142: const void *data, size_t size,
1.33 paf 143: bool as_text/*,
1.20 paf 144: bool exclusive*/) {
1.64 parser 145: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.28 paf 146: int f;
1.50 paf 147: if(access(fname, W_OK)!=0) {/*no*/
1.63 parser 148: create_dir_for_file(file_spec);
1.50 paf 149:
1.33 paf 150: if((f=open(fname, O_WRONLY|O_CREAT|_O_BINARY, 0666))>0)
1.28 paf 151: close(f);
152: }
153: if(access(fname, R_OK|W_OK)==0) {
1.34 paf 154: int mode=O_RDWR|(as_text?_O_TEXT:_O_BINARY)
1.18 paf 155: #ifdef WIN32
1.28 paf 156: |O_TRUNC
1.18 paf 157: #endif
1.28 paf 158: ;
1.33 paf 159: if((f=open(fname, mode, 0666))>=0) {
1.28 paf 160: /*if(exclusive)
161: flock(f, LOCK_EX);*/
162:
1.33 paf 163: if(size) write(f, data, size);
1.18 paf 164: #ifndef WIN32
1.33 paf 165: ftruncate(f, size);
1.18 paf 166: #endif
1.28 paf 167: /*if(exclusive)
168: flock(f, LOCK_UN);*/
169: close(f);
170: return;
1.18 paf 171: }
172: }
1.73 parser 173: throw Exception(0, 0,
1.33 paf 174: &file_spec,
1.54 parser 175: "write failed: %s (%d), actual filename '%s'",
176: strerror(errno), errno, fname);
1.30 paf 177: }
178:
1.63 parser 179: // throws nothing! [this is required in file_move & file_delete]
1.50 paf 180: static void rmdir(const String& file_spec, size_t pos_after) {
181: int pos_before;
182: if((pos_before=file_spec.pos("/", 1, pos_after))>=0)
183: rmdir(file_spec, pos_before+1);
184:
1.64 parser 185: rmdir(file_spec.mid(0, pos_after-1/* / */).cstr(String::UL_FILE_SPEC));
1.50 paf 186: }
1.30 paf 187: void file_delete(Pool& pool, const String& file_spec) {
1.64 parser 188: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.54 parser 189: if(unlink(fname)!=0)
1.73 parser 190: throw Exception(0, 0,
1.33 paf 191: &file_spec,
1.54 parser 192: "unlink failed: %s (%d), actual filename '%s'",
193: strerror(errno), errno, fname);
1.50 paf 194:
195: rmdir(file_spec, 1);
1.60 parser 196: }
197: void file_move(Pool& pool, const String& old_spec, const String& new_spec) {
1.64 parser 198: const char *old_spec_cstr=old_spec.cstr(String::UL_FILE_SPEC);
199: const char *new_spec_cstr=new_spec.cstr(String::UL_FILE_SPEC);
1.63 parser 200:
201: create_dir_for_file(new_spec);
202:
1.60 parser 203: if(rename(old_spec_cstr, new_spec_cstr)!=0)
1.73 parser 204: throw Exception(0, 0,
1.60 parser 205: &old_spec,
206: "rename failed: %s (%d), actual filename '%s' to '%s'",
207: strerror(errno), errno, old_spec_cstr, new_spec_cstr);
1.63 parser 208:
209: rmdir(old_spec, 1);
1.31 paf 210: }
211:
1.51 paf 212:
213: static bool entry_readable(const String& file_spec, bool need_dir) {
1.64 parser 214: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.51 paf 215: struct stat finfo;
216: if(access(fname, R_OK)==0 && stat(fname, &finfo)==0) {
1.73 parser 217: bool is_dir=finfo.st_mode&S_IFDIR != 0;
1.51 paf 218: return is_dir==need_dir;
219: }
220: return false;
221: }
1.31 paf 222: bool file_readable(const String& file_spec) {
1.51 paf 223: return entry_readable(file_spec, false);
224: }
225: bool dir_readable(const String& file_spec) {
226: return entry_readable(file_spec, true);
1.65 parser 227: }
228: String *file_readable(const String& path, const String& name) {
229: String *result=new(path.pool()) String(path);
230: *result << "/";
231: *result << name;
232: return file_readable(*result)?result:0;
1.43 paf 233: }
234: bool file_executable(const String& file_spec) {
1.64 parser 235: return access(file_spec.cstr(String::UL_FILE_SPEC), X_OK)==0;
1.44 paf 236: }
237:
1.64 parser 238: bool file_stat(const String& file_spec,
1.58 parser 239: size_t& rsize,
240: time_t& ratime,
241: time_t& rmtime,
1.64 parser 242: time_t& rctime,
243: bool fail_on_read_problem) {
1.44 paf 244: Pool& pool=file_spec.pool();
1.64 parser 245: const char *fname=file_spec.cstr(String::UL_FILE_SPEC);
1.44 paf 246: struct stat finfo;
247: if(stat(fname, &finfo)!=0)
1.64 parser 248: if(fail_on_read_problem)
1.73 parser 249: throw Exception(0, 0,
1.67 parser 250: &file_spec,
251: "getting file size failed: %s (%d), real filename '%s'",
252: strerror(errno), errno, fname);
1.64 parser 253: else
254: return false;
1.58 parser 255: rsize=finfo.st_size;
256: ratime=finfo.st_atime;
257: rmtime=finfo.st_mtime;
258: rctime=finfo.st_ctime;
1.64 parser 259: return true;
1.18 paf 260: }
261:
/**
	Cuts the next row off a delimited, NUL-terminated buffer.

	The delimiter that ends the row is overwritten with 0 and *row_ref
	is moved right after it; when no delimiter is left *row_ref becomes 0.

	@return start of the row, or 0 when *row_ref is 0 or when the
		remainder is empty and holds no delimiter
*/
char *getrow(char **row_ref, char delim) {
	char *row=*row_ref;
	if(!row) // already exhausted
		return row;

	char *sep=strchr(row, delim);
	if(sep) {
		*sep=0;
		*row_ref=sep+1;
		return row;
	}

	// last piece: report it only when it is not empty
	*row_ref=0;
	return *row?row:0;
}
273:
/**
	Splits @a string at the first @a delim.

	The delimiter is overwritten with 0, so @a string itself becomes
	the left part.

	@return the part after the delimiter, or 0 when @a string is 0
		or holds no delimiter
*/
char *lsplit(char *string, char delim) {
	char *sep=string?strchr(string, delim):0;
	if(!sep)
		return 0;

	*sep=0;
	return sep+1;
}
284:
285: char *lsplit(char **string_ref, char delim) {
286: char *result=*string_ref;
287: char *next=lsplit(*string_ref, delim);
288: *string_ref=next;
289: return result;
1.9 paf 290: }
291:
/**
	Splits @a string at the last @a delim.

	The delimiter is overwritten with 0, so @a string itself becomes
	the left part.

	@return the part after the delimiter, or 0 when @a string is 0
		or holds no delimiter
*/
char *rsplit(char *string, char delim) {
	if(!string)
		return 0;

	char *sep=strrchr(string, delim);
	if(!sep)
		return 0;

	*sep=0;
	return sep+1;
}
302:
1.37 paf 303: /// @todo less stupid type detection
1.10 paf 304: char *format(Pool& pool, double value, char *fmt) {
1.78 ! paf 305: char *result=(char *)pool.malloc(MAX_NUMBER, 4);
1.10 paf 306: if(fmt)
307: if(strpbrk(fmt, "diouxX"))
308: if(strpbrk(fmt, "ouxX"))
1.33 paf 309: snprintf(result, MAX_NUMBER, fmt, (uint)value );
1.10 paf 310: else
1.33 paf 311: snprintf(result, MAX_NUMBER, fmt, (int)value );
1.10 paf 312: else
313: snprintf(result, MAX_NUMBER, fmt, value);
314: else
1.33 paf 315: snprintf(result, MAX_NUMBER, "%d", (int)value);
1.10 paf 316:
317: return result;
1.12 paf 318: }
319:
/**
	Writes a buffer to stdout.

	On WIN32 the buffer is written in chunks of at most 8K
	[NOTE(review): reason for chunking is not stated in this file].

	@param buf bytes to write
	@param size number of bytes in @a buf
	@return number of bytes actually written, on all platforms
		[the WIN32 branch used to return the number of bytes NOT written]
*/
size_t stdout_write(const void *buf, size_t size) {
#ifdef WIN32
	const size_t max_chunk=8*0x400;
	const char *bytes=(const char *)buf;
	size_t total=0;
	while(total<size) {
		const size_t left=size-total;
		const size_t chunk_written=fwrite(bytes+total, 1, 
			left<max_chunk?left:max_chunk, stdout);
		if(!chunk_written) // error: report what has been written so far
			break;
		total+=chunk_written;
	}

	return total;
#else
	return fwrite(buf, 1, size, stdout);
#endif
}
1.14 paf 335:
1.77 parser 336: char *unescape_chars(Pool& pool, const char *cp, int len) {
1.78 ! paf 337: char *s=(char *)pool.malloc(len + 1, 5);
1.14 paf 338: enum EscapeState {
1.33 paf 339: EscapeRest,
340: EscapeFirst,
1.14 paf 341: EscapeSecond
342: } escapeState=EscapeRest;
343: int escapedValue=0;
344: int srcPos=0;
345: int dstPos=0;
346: while(srcPos < len) {
347: int ch=cp[srcPos];
348: switch(escapeState) {
349: case EscapeRest:
350: if(ch=='%') {
351: escapeState=EscapeFirst;
352: } else if(ch=='+') {
353: s[dstPos++]=' ';
354: } else {
355: s[dstPos++]=ch;
356: }
357: break;
358: case EscapeFirst:
359: escapedValue=hex_value[ch] << 4;
360: escapeState=EscapeSecond;
361: break;
362: case EscapeSecond:
363: escapedValue +=hex_value[ch];
364: s[dstPos++]=escapedValue;
365: escapeState=EscapeRest;
366: break;
367: }
368: srcPos++;
369: }
370: s[dstPos]=0;
371: return s;
372: }
373:
1.52 paf 374: /// used by attributed_meaning_to_string / append_attribute_subattribute
1.40 paf 375: struct Attributed_meaning_info {
1.52 paf 376: String *header; // header line being constructed
377: String::Untaint_lang lang; // language in which to append to that line
1.40 paf 378: };
1.17 paf 379: static void append_attribute_subattribute(const Hash::Key& akey, Hash::Val *avalue,
1.14 paf 380: void *info) {
381: if(akey==VALUE_NAME)
382: return;
383:
1.40 paf 384: Attributed_meaning_info& ami=*static_cast<Attributed_meaning_info *>(info);
385:
1.14 paf 386: // ...; charset=windows1251
1.48 paf 387: *ami.header << "; ";
1.70 parser 388: ami.header->append(akey, ami.lang);
1.48 paf 389: *ami.header << "=";
1.70 parser 390: ami.header->append(static_cast<Value *>(avalue)->as_string(), ami.lang);
1.14 paf 391: }
1.49 paf 392: const String& attributed_meaning_to_string(Value& meaning,
393: String::Untaint_lang lang) {
1.20 paf 394: String &result=*new(meaning.pool()) String(meaning.pool());
1.75 parser 395: if(Hash *hash=meaning.get_hash(0)) {
1.14 paf 396: // $value(value) $subattribute(subattribute value)
397: if(Value *value=static_cast<Value *>(hash->get(*value_name)))
1.40 paf 398: result.append(value->as_string(), lang, true);
1.14 paf 399:
1.40 paf 400: Attributed_meaning_info attributed_meaning_info={
1.52 paf 401: &result,
402: lang
1.40 paf 403: };
404: hash->for_each(append_attribute_subattribute, &attributed_meaning_info);
1.14 paf 405: } else // result value
1.40 paf 406: result.append(meaning.as_string(), lang, true);
1.14 paf 407:
408: return result;
1.24 paf 409: }
410:
411: #ifdef WIN32
/// Replaces every '\\' of a NUL-terminated string with '/', in place; 0 is allowed.
void back_slashes_to_slashes(char *s) {
	if(!s)
		return;

	while((s=strchr(s, '\\')))
		*s++='/';
}
1.42 paf 418: /*
419: void slashes_to_back_slashes(char *s) {
420: if(s)
421: for(; *s; s++)
422: if(*s=='/')
423: *s='\\';
424: }
425: */
1.24 paf 426: #endif
1.41 paf 427:
/**
	Compares two strings ignoring the case of letters.

	@param s1 first string
	@param s2 second string
	@param strict true = strings must be of equal length;
		false = it is enough for one string to be a prefix of the other
	@return true when the strings are equal in the above sense
*/
bool StrEqNc(const char *s1, const char *s2, bool strict) {
	for(;; s1++, s2++) {
		if(!*s1 || !*s2) {
			// both ended: equal; only one ended: prefix match
			return (!*s1 && !*s2) || !strict;
		}

		// <ctype.h> functions are undefined for negative values,
		// and a plain char is negative for bytes >=0x80 on many platforms
		const unsigned char c1=(unsigned char)*s1;
		const unsigned char c2=(unsigned char)*s2;
		if(isalpha(c1)) {
			if(tolower(c1)!=tolower(c2))
				return false;
		} else if(c1!=c2)
			return false;
	}
}
446:
/// @return 1 when @a year is divisible by 4 and is not a century
/// year indivisible by 400; 0 otherwise
static int isLeap(int year) {
	if(year%4)
		return 0;
	if(year%100)
		return 1;
	return year%400?0:1;
}
452:
453: int getMonthDays(int year, int month) {
454: int monthDays[]={
455: 31,
456: isLeap(year) ? 29 : 28,
457: 31,
458: 30,
459: 31,
460: 30,
461: 31,
462: 31,
463: 30,
464: 31,
465: 30,
466: 31
467: };
468: return monthDays[month];
1.41 paf 469: }
1.69 parser 470:
/**
	Makes the range [start, end) single-line, in place:
	every '\n' becomes '|' and every '\r' becomes ' '.
*/
void remove_crlf(char *start, char *end) {
	char *cur=start;
	while(cur<end) {
		if(*cur=='\n')
			*cur='|';
		else if(*cur=='\r')
			*cur=' ';
		++cur;
	}
}
E-mail: