--- parser3/src/include/pa_string.h 2001/01/29 21:51:51 1.13 +++ parser3/src/include/pa_string.h 2001/03/14 08:50:01 1.35 @@ -1,17 +1,21 @@ /* - $Id: pa_string.h,v 1.13 2001/01/29 21:51:51 paf Exp $ + Parser + Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) + Author: Alexander Petrosyan (http://design.ru/paf) + + $Id: pa_string.h,v 1.35 2001/03/14 08:50:01 paf Exp $ */ /* String Chunk0 ====== ======== - head--------->[ptr, size] - append_here-------->[ptr, size] - link_row ........ - . . - . [ptr, size] - ...........>[link to the next chunk] + head--------------->[ptr, size, ...] + append_here-------->[ptr, size, ...] + . + . + [ptr, size, ...] + link_row----------->[link to the next chunk] */ @@ -19,50 +23,82 @@ #define PA_STRING_H #ifdef HAVE_CONFIG_H -#include "pa_config.h" +# include "pa_config.h" #endif #include +#include "pa_pool.h" #include "pa_types.h" -class Pool; +#define UNTAINT_TIMES_BIGGER 10 #ifndef NO_STRING_ORIGIN -# define STRING_APPEND_PARAMS const char *src, char *file, uint line -# define APPEND(src, file, line) real_append(src, file, line) +# define STRING_APPEND_PARAMS \ + const char *src, size_t size, \ + bool tainted, \ + const char *file, uint line +# define APPEND(src, size, file, line) real_append(src, size, false, file, line) +# define APPEND_TAINTED(src, size, file, line) real_append(src, size, true, file, line) #else -# define STRING_APPEND_PARAMS const char *src -# define APPEND(src, file, line) real_append(src) +# define STRING_APPEND_PARAMS \ + const char *src, \ + size_t size, \ + bool tainted +# define APPEND(src, size, file, line) real_append(src, size, false) +# define APPEND_TAINTED(src, size, file, line) real_append(src, size, true) #endif +#define APPEND_CONST(src) APPEND(src, 0, 0, 0) - -class String { +class String : public Pooled { public: enum { CR_PREALLOCATED_COUNT=5, CR_GROW_PERCENT=60 }; + enum Untaint_lang { + UNKNOWN=0, // when get by name fails + NO, // clean + YES, // tainted, untaint language as assigned later + // untaint languages. assigned by ^untaint[lang]{...} + PASS_APPENDED, + // leave language built into string being appended + // just a flag, that value not stored + AS_IS, + TABLE, + SQL, + JS, + HTML, + HTML_TYPO + }; + public: - void *operator new(size_t size, Pool& apool); String(Pool& apool); - String(String& src); - size_t size() { return fsize; } - int used_rows() { return fused_rows; } - char *cstr(); + String(const String& src); + size_t size() const { return fsize; } + int used_rows() const { return fused_rows; } + char *cstr() const; String& real_append(STRING_APPEND_PARAMS); - bool operator == (String& src); - - uint hash_code(); + int cmp (const String& src) const; + bool operator < (const String& src) const { return cmp(src)<0; } + bool operator > (const String& src) const { return cmp(src)>0; } + bool operator <= (const String& src) const { return cmp(src)<=0; } + bool operator >= (const String& src) const { return cmp(src)>=0; } + bool operator == (const String& src) const { + if(size()!=src.size()) // can speed up in trivial case + return false; + return cmp(src)==0; + } + bool operator != (const String& src) const { return cmp(src)!=0; } - const Origin& origin() const { return head.rows[0].item.origin; } + bool operator == (const char* b_ptr) const; + String& append(const String& src, Untaint_lang lang); -protected: + uint hash_code() const; - // the pool I'm allocated on - Pool& pool; + const Origin& origin() const { return head.rows[0].item.origin; } private: @@ -70,11 +106,14 @@ private: // the number of rows in chunk int count; union Row { - // chunk item - struct { - const char *ptr; // pointer to the start of string fragment - size_t size; // length of the fragment - Origin origin; // origin of this fragment + // fragment + struct { + const char *ptr; // pointer to the start + size_t size; // length + Untaint_lang lang; // untaint flag, later untaint language +#ifndef NO_STRING_ORIGIN + Origin origin; // origin +#endif } item; Chunk *link; // link to the next chunk in chain } rows[CR_PREALLOCATED_COUNT]; @@ -91,8 +130,8 @@ private: Chunk::Row *link_row; private: - // last chank allocated count - int curr_chunk_rows; + // last chunk + Chunk *last_chunk; // string size size_t fsize; @@ -106,6 +145,7 @@ private: return append_here == link_row; } void expand(); + void set_lang(Chunk::Row *row, Untaint_lang lang, size_t size); private: //disabled