--- parser3/src/include/pa_common.h 2004/03/05 11:38:12 1.99 +++ parser3/src/include/pa_common.h 2013/07/16 14:55:45 1.151 @@ -1,20 +1,67 @@ /** @file Parser: commonly used functions. - Copyright (c) 2001-2004 ArtLebedev Group (http://www.artlebedev.com) + Copyright (c) 2001-2012 Art. Lebedev Studio (http://www.artlebedev.com) Author: Alexandr Petrosian (http://paf.design.ru) */ #ifndef PA_COMMON_H #define PA_COMMON_H -static const char * const IDENT_COMMON_H="$Date: 2004/03/05 11:38:12 $"; +#define IDENT_PA_COMMON_H "$Id: pa_common.h,v 1.151 2013/07/16 14:55:45 moko Exp $" #include "pa_string.h" #include "pa_hash.h" +class Request; + +// defines +#define HTTP_USER_AGENT "user-agent" + +#define HTTP_STATUS "status" +#define HTTP_STATUS_CAPITALIZED "Status" + +#define HTTP_CONTENT_LENGTH "content-length" +#define HTTP_CONTENT_LENGTH_CAPITALIZED "Content-Length" + +#define HTTP_CONTENT_TYPE "content-type" +#define HTTP_CONTENT_TYPE_UPPER "CONTENT-TYPE" +#define HTTP_CONTENT_TYPE_CAPITALIZED "Content-Type" +#define HTTP_CONTENT_TYPE_FORM_URLENCODED "application/x-www-form-urlencoded" +#define HTTP_CONTENT_TYPE_MULTIPART_FORMDATA "multipart/form-data" +#define HTTP_CONTENT_TYPE_MULTIPART_RELATED "multipart/related" +#define HTTP_CONTENT_TYPE_MULTIPART_MIXED "multipart/mixed" + +#define CONTENT_TRANSFER_ENCODING_NAME "content-transfer-encoding" +#define CONTENT_TRANSFER_ENCODING_CAPITALIZED "Content-Transfer-Encoding" + +#define CONTENT_DISPOSITION "content-disposition" +#define CONTENT_DISPOSITION_CAPITALIZED "Content-Disposition" +#define CONTENT_DISPOSITION_ATTACHMENT "attachment" +#define CONTENT_DISPOSITION_INLINE "inline" +#define CONTENT_DISPOSITION_FILENAME_NAME "filename" + +#define BASE64_STRICT_OPTION_NAME "strict" + +const String http_content_type(HTTP_CONTENT_TYPE); + +const String content_transfer_encoding_name(CONTENT_TRANSFER_ENCODING_NAME); + +const String content_disposition(CONTENT_DISPOSITION); +const String content_disposition_inline(CONTENT_DISPOSITION_INLINE); +const String content_disposition_attachment(CONTENT_DISPOSITION_ATTACHMENT); +const String content_disposition_filename_name(CONTENT_DISPOSITION_FILENAME_NAME); + + +#define HASH_ORDER + +#ifdef HASH_ORDER +#undef PA_HASH_CLASS +#include "pa_hash.h" +#endif + class Value; -typedef Hash HashStringValue; +typedef HASH_STRING HashStringValue; // replace system s*nprintf with our versions #undef vsnprintf @@ -56,24 +103,28 @@ inline long lseek( int handle, long offs #endif +const char* capitalize(const char* s); + /** under WIN32 "t" mode fixes DOS chars OK, can't say that about other systems/ line break styles */ void fix_line_breaks( - char *str, - size_t& length///< may change! used to speedup next actions - ); + char *str, + size_t& length///< may change! used to speedup next actions + ); int pa_lock_shared_blocking(int fd); int pa_lock_exclusive_blocking(int fd); int pa_lock_exclusive_nonblocking(int fd); int pa_unlock(int fd); +void create_dir_for_file(const String& file_spec); + typedef void (*File_read_action)( - struct stat& finfo, - int f, - const String& file_spec, const char* fname, bool as_text, - void *context); + struct stat& finfo, + int f, + const String& file_spec, const char* fname, bool as_text, + void *context); /** shared-lock specified file, @@ -86,18 +137,24 @@ bool file_read_action_under_lock(const S const char* action_name, File_read_action action, void *context, bool as_text=false, bool fail_on_read_problem=true); + /** read specified text file using if fail_on_read_problem is true[default] throws an exception WARNING: charset is used for http header case conversion, it's not a charset of input file! - - @returns true if read OK */ char *file_read_text(Request_charsets& charsets, - const String& file_spec, - bool fail_on_read_problem=true, - HashStringValue* options=0/*, HashStringValue* * out_fields=0*/); + const String& file_spec, + bool fail_on_read_problem=true, + HashStringValue* options=0, + bool transcode_result=true); + +char *file_load_text(Request& r, + const String& file_spec, + bool fail_on_read_problem=true, + HashStringValue* options=0, + bool transcode_result=true); struct File_read_result { bool success; @@ -110,14 +167,20 @@ struct File_read_result { if fail_on_read_problem is true[default] throws an exception WARNING: charset is used for http header case conversion, it's not a charset of input file! - - @returns true if read OK */ -File_read_result file_read(Request_charsets& charsets, - const String& file_spec, - bool as_text, - HashStringValue* options=0, - bool fail_on_read_problem=true); +File_read_result file_read(Request_charsets& charsets, + const String& file_spec, + bool as_text, + HashStringValue* options=0, + bool fail_on_read_problem=true, + char* buf=0, size_t offset=0, size_t size=0, bool transcode_text_result=true); + +File_read_result file_load(Request& r, + const String& file_spec, + bool as_text, + HashStringValue* options=0, + bool fail_on_read_problem=true, + char* buf=0, size_t offset=0, size_t size=0, bool transcode_text_result=true); typedef void (*File_write_action)(int f, void *context); @@ -131,7 +194,9 @@ typedef void (*File_write_action)(int f, */ bool file_write_action_under_lock( const String& file_spec, - const char* action_name, File_write_action action, void *context, + const char* action_name, + File_write_action action, + void *context, bool as_text=false, bool do_append=false, bool do_block=true, @@ -142,35 +207,38 @@ bool file_write_action_under_lock( throws an exception in case of problems */ void file_write( + Request_charsets& charsets, const String& file_spec, - const char* data, size_t size, + const char* data, + size_t size, bool as_text, - bool do_append=false); + bool do_append=false, + Charset* asked_charset=0); /** delete specified file throws an exception in case of problems */ -bool file_delete(const String& file_spec, bool fail_on_problem=true); +bool file_delete(const String& file_spec, bool fail_on_problem=true, bool keep_empty_dirs=false); /** move specified file throws an exception in case of problems */ -void file_move(const String& old_spec, const String& new_spec); +void file_move(const String& old_spec, const String& new_spec, bool keep_empty_dirs=false); bool entry_exists(const char* fname, struct stat *afinfo=0); bool entry_exists(const String& file_spec); -bool file_readable(const String& file_spec); -bool dir_readable(const String& file_spec); -const String* file_readable(const String& path, const String& name); +bool file_exist(const String& file_spec); +bool dir_exists(const String& file_spec); +const String* file_exist(const String& path, const String& name); bool file_executable(const String& file_spec); bool file_stat(const String& file_spec, - size_t& rsize, - time_t& ratime, - time_t& rmtime, - time_t& rctime, - bool fail_on_read_problem=true); + size_t& rsize, + time_t& ratime, + time_t& rmtime, + time_t& rctime, + bool fail_on_read_problem=true); /** scans for @a delim[default \n] in @a *row_ref, @@ -182,11 +250,13 @@ char *getrow(char **row_ref,char delim=' char *lsplit(char *string, char delim); char *lsplit(char **string_ref,char delim); char *rsplit(char *string, char delim); -const char* format(double value, char *fmt); +const char* format(double value, const char *fmt); size_t stdout_write(const void *buf, size_t size); -char *unescape_chars(const char* cp, int len); +char* unescape_chars(const char* cp, int len, Charset* client_charset=0, bool js=false/*true==decode \uXXXX and don't convert '+' to space*/); + +char *search_stop(char*& current, char cstop_at); #ifdef WIN32 void back_slashes_to_slashes(char *s); @@ -198,21 +268,150 @@ void back_slashes_to_slashes(char *s); qsort(names,cnt,sizeof_names,func_addr) #endif -bool StrEqNc(const char* s1, const char* s2, bool strict=true); +bool StrStartFromNC(const char* str, const char* substr, bool equal=false); +size_t strpos(const char *str, const char *substr); + +Charset* detect_charset(const char* content_type); #define SECS_PER_DAY (60*60*24) int getMonthDays(int year, int month); -void remove_crlf(char *start, char *end); +int remove_crlf(char *start, char *end); + +inline bool pa_isalpha(unsigned char c) { + return (((c>='A') && (c<='Z')) || ((c>='a') && (c<='z'))); +} + +inline bool pa_isalnum(unsigned char c) { + return (((c>='0') && (c<='9')) || pa_isalpha(c)); +} -#ifdef PA_SAFE_MODE void check_safe_mode(struct stat finfo, const String& file_spec, const char* fname); -#endif -char* pa_base64(const char *in, size_t len); +void pa_base64_decode(const char *in, size_t in_size, char*& result, size_t& result_size, bool strict=false); +char* pa_base64_encode(const char *in, size_t in_size); +struct File_base64_action_info { + unsigned char** base64; +}; +char* pa_base64_encode(const String& file_spec); +static void file_base64_file_action( + struct stat& finfo, + int f, + const String&, const char* /*fname*/, bool, + void *context); + +#define FILE_BUFFER_SIZE 4096 +static unsigned long crc32Table[256]; +static void InitCrc32Table() +{ + if(crc32Table[1] == 0){ + // This is the official polynomial used by CRC32 in PKZip. + // Often times the polynomial shown reversed as 0x04C11DB7. + static const unsigned long dwPolynomial = 0xEDB88320; + + for(int i = 0; i < 256; i++) + { + unsigned long dwCrc = i; + for(int j = 8; j > 0; j--) + { + if(dwCrc & 1) + dwCrc = (dwCrc >> 1) ^ dwPolynomial; + else + dwCrc >>= 1; + } + crc32Table[i] = dwCrc; + } + } +} + +int file_block_read(const int f, unsigned char* buffer, const size_t size); + +inline void CalcCrc32(const unsigned char byte, unsigned long &crc32) +{ + crc32 = ((crc32) >> 8) ^ crc32Table[(byte) ^ ((crc32) & 0x000000FF)]; +} + +const unsigned long pa_crc32(const char *in, size_t in_size); +const unsigned long pa_crc32(const String& file_spec); +static void file_crc32_file_action( + struct stat& finfo, + int f, + const String&, const char* /*fname*/, bool, + void *context); + +static const char* hex_string(unsigned char* bytes, size_t size, bool upcase) { + char *bytes_hex=new(PointerFreeGC) char [size*2/*byte->hh*/+1/*for zero-teminator*/]; + unsigned char *src=bytes; + unsigned char *end=bytes+size; + char *dest=bytes_hex; + + const char *hex=upcase?"0123456789ABCDEF":"0123456789abcdef"; + + for(; srcput(key, value); +} + +static void remove_key_from( + HashStringValue::key_type key, + HashStringValue::value_type /*value*/, + HashStringValue* dest) { + dest->remove(key); +} + +static String::C date_gmt_string(tm* tms) { + /// http://www.w3.org/Protocols/rfc2616/rfc2616-sec3.html#sec3.3 + static const char month_names[12][4]={ + "Jan","Feb","Mar","Apr","May","Jun","Jul","Aug","Sep","Oct","Nov","Dec"}; + static const char days[7][4]={ + "Sun","Mon","Tue","Wed","Thu","Fri","Sat"}; + + char *buf=new(PointerFreeGC) char[MAX_STRING]; + return String::C(buf, + snprintf(buf, MAX_STRING, "%s, %.2d %s %.4d %.2d:%.2d:%.2d GMT", + days[tms->tm_wday], + tms->tm_mday,month_names[tms->tm_mon],tms->tm_year+1900, + tms->tm_hour,tms->tm_min,tms->tm_sec)); +} // globals extern const String file_status_name; +// global defines for file options which are handled but not checked elsewhere, we check them + +#define PA_SQL_LIMIT_NAME "limit" +#define PA_SQL_OFFSET_NAME "offset" +#define PA_COLUMN_SEPARATOR_NAME "separator" +#define PA_COLUMN_ENCLOSER_NAME "encloser" +#define PA_CHARSET_NAME "charset" +#define PA_RESPONSE_CHARSET_NAME "response-charset" + +// globals defines for sql options + +#define SQL_BIND_NAME "bind" +#define SQL_DEFAULT_NAME "default" +#define SQL_DISTINCT_NAME "distinct" +#define SQL_VALUE_TYPE_NAME "type" + +#ifndef DOXYGEN +enum Table2hash_distint { D_ILLEGAL, D_FIRST }; +enum Table2hash_value_type { C_HASH, C_STRING, C_TABLE }; +#endif + #endif +