--- parser3/src/classes/table.C 2001/03/25 08:52:28 1.26 +++ parser3/src/classes/table.C 2001/05/08 06:00:34 1.72 @@ -1,53 +1,96 @@ /** @file - Parser: table parser class. + Parser: @b table parser class. Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) Author: Alexander Petrosyan (http://design.ru/paf) - $Id: table.C,v 1.26 2001/03/25 08:52:28 paf Exp $ + $Id: table.C,v 1.72 2001/05/08 06:00:34 paf Exp $ */ #include "pa_config_includes.h" + +#include "pcre.h" + +#include "classes.h" #include "pa_common.h" #include "pa_request.h" -#include "_table.h" #include "pa_vtable.h" #include "pa_vint.h" +#include "pa_sql_connection.h" +#include "pa_dir.h" +#include "pa_vbool.h" + +// defines + +#define TABLE_CLASS_NAME "table" -// global var +// class -VStateless_class *table_class; +class MTable : public Methoded { +public: // VStateless_class + Value *create_new_value(Pool& pool) { return new(pool) VTable(pool); } + +public: + MTable(Pool& pool); + +public: // Methoded + bool used_directly() { return true; } +}; // methods -static void set_or_load( - Request& r, - const String& method_name, Array *params, - bool is_load) { +static void _set(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); // data is last parameter - Value *vdata_or_filename=static_cast(params->get(params->size()-1)); - // forcing - // ^load[this file name type] - // ^set{this body type} - r.fail_if_junction_(is_load, *vdata_or_filename, - method_name, is_load?"file name must not be junction":"body must be junction"); - - // data or file_name - char *data; - if(is_load) { - // forcing untaint language - String lfile_name(pool); - lfile_name.append(vdata_or_filename->as_string(), String::UL_FILE_NAME, true); - // loading text - data=file_read_text(pool, r.absolute(lfile_name)); + Value& vdata=params->get_junction(params->size()-1, "body must be code"); + + Temp_lang temp_lang(r, String::UL_PASS_APPENDED); + const String& data=r.process(vdata).as_string(); + + size_t pos_after=0; + // parse columns + Array *columns; + if(params->size()==2) { + columns=0; } else { - // suggesting untaint language - Temp_lang temp_lang(r, String::UL_TABLE); - data=r.process(*vdata_or_filename).as_string().cstr(); + columns=new(pool) Array(pool); + + Array head(pool); + data.split(head, &pos_after, "\n", 1, String::UL_CLEAN, 1); + if(head.size()) + head.get_string(0)->split(*columns, 0, "\t", 1, String::UL_CLEAN); + } + + Table& table=*new(pool) Table(pool, &method_name, columns); + // parse cells + Array rows(pool); + data.split(rows, &pos_after, "\n", 1, String::UL_CLEAN); + int size=rows.quick_size(); + for(int i=0; i(r.self)->set_table(table); +} + +static void _load(Request& r, const String& method_name, MethodParams *params) { + Pool& pool=r.pool(); + // filename is last parameter + Value& vfilename=params->get_no_junction(params->size()-1, + "file name must not be code"); + + // loading text + char *data=file_read_text(pool, r.absolute(vfilename.as_string())); + // parse columns Array *columns; #ifndef NO_STRING_ORIGIN @@ -63,19 +106,21 @@ static void set_or_load( if(char *row_chars=getrow(&data)) do { String *name=new(pool) String(pool); - name->APPEND(lsplit(&row_chars, '\t'), 0, file, line++); + name->APPEND_TAINTED(lsplit(&row_chars, '\t'), 0, file, line++); *columns+=name; } while(row_chars); } // parse cells - Table& table=*new(pool) Table(pool, columns); + Table& table=*new(pool) Table(pool, &method_name, columns); char *row_chars; while(row_chars=getrow(&data)) { + if(!*row_chars) // remove empty lines + continue; Array *row=new(pool) Array(pool); while(char *cell_chars=lsplit(&row_chars, '\t')) { String *cell=new(pool) String(pool); - cell->APPEND(cell_chars, 0, file, line); + cell->APPEND_TAINTED(cell_chars, 0, file, line); *row+=cell; } line++; @@ -86,45 +131,28 @@ static void set_or_load( static_cast(r.self)->set_table(table); } - -static void _set(Request& r, const String& method_name, Array *params) { - set_or_load(r, method_name, params, false); -} - -static void _load(Request& r, const String& method_name, Array *params) { - set_or_load(r, method_name, params, true); -} - -static void _save(Request& r, const String& method_name, Array *params) { +static void _save(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); - Value *vfile_name=static_cast(params->get(params->size()-1)); - // forcing - // ^save[this body type] - r.fail_if_junction_(true, *vfile_name, - method_name, "file name must not be junction"); - - // forcing untaint language - String lfile_name(pool); - lfile_name.append(vfile_name->as_string(), - String::UL_FILE_NAME, true); + Value& vtable_name=params->get_no_junction(params->size()-1, + "file name must not be code"); Table& table=static_cast(r.self)->table(); String sdata(pool); if(params->size()==1) { // not nameless=named output // write out names line - if(const Array *columns=table.columns()) { // named table - for(int column=0; columnsize(); column++) { + if(table.columns()) { // named table + for(int column=0; columnsize(); column++) { if(column) sdata.APPEND_CONST("\t"); - sdata.append(*static_cast(columns->quick_get(column)), + sdata.append(*static_cast(table.columns()->quick_get(column)), String::UL_TABLE); } } else { // nameless table - int size=table.size()?static_cast(table.get(0))->size():0; - if(size) - for(int column=0; column(table.get(0))->size():0; + if(lsize) + for(int column=0; column(r.self)->table().size()); r.write_no_lang(value); } -static void _line(Request& r, const String&, Array *) { +static void _line(Request& r, const String& method_name, MethodParams *) { Pool& pool=r.pool(); - Value& value=*new(pool) VInt(pool, 1+static_cast(r.self)->table().get_current()); + Value& value=*new(pool) VInt(pool, 1+static_cast(r.self)->table().current()); r.write_no_lang(value); } -static void _offset(Request& r, const String&, Array *params) { +static void _offset(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); Table& table=static_cast(r.self)->table(); - if(params->size()) { - if(int size=table.size()) { - int offset= - (int)r.process(*static_cast(params->get(0))).get_double(); - table.set_current((table.get_current()+offset+size)%size); - } - } else { - Value& value=*new(pool) VInt(pool, table.get_current()); + if(params->size()) + table.shift((int)r.process(params->get(0)).as_double()); + else { + Value& value=*new(pool) VInt(pool, table.current()); r.write_no_lang(value); } } -static void _menu(Request& r, const String& method_name, Array *params) { - Value& body_code=*static_cast(params->get(0)); - // forcing ^menu{this param type} - r.fail_if_junction_(false, body_code, - method_name, "body must be junction"); +static void _menu(Request& r, const String& method_name, MethodParams *params) { + Value& body_code=params->get_junction(0, "body must be code"); - Value *delim_code=params->size()==2?static_cast(params->get(1)):0; + Value *delim_code=params->size()==2?¶ms->get(1):0; - Table& table=static_cast(r.self)->table(); + VTable& vtable=*static_cast(r.self); + Table& table=vtable.table(); bool need_delim=false; + vtable.lock(); int saved_current=table.current(); for(int row=0; row(r.self)->table(); + if(table.size()==0) + r.write_pass_lang(r.process(params->get(0))); + else if(params->size()>1) + r.write_pass_lang(r.process(params->get(1))); +} + +/// used by table: _record / store_column_item_to_hash +struct Record_info { + Pool *pool; + Table *table; + Hash *hash; +}; +static void store_column_item_to_hash(Array::Item *item, void *info) { + Record_info& ri=*static_cast(info); + String& column_name=*static_cast(item); + const String *column_item=ri.table->item(column_name); + Value *value; + if(column_item) + value=new(*ri.pool) VString(*column_item); + else + value=new(*ri.pool) VUnknown(*ri.pool); + ri.hash->put(column_name, value); +} +static void _record(Request& r, const String& method_name, MethodParams *params) { + Table& table=static_cast(r.self)->table(); + if(const Array *columns=table.columns()) { + Pool& pool=r.pool(); + Value& value=*new(pool) VHash(pool); + Record_info record_info={&pool, &table, value.get_hash()}; + columns->for_each(store_column_item_to_hash, &record_info); + + r.write_no_lang(value); + } +} + +struct Seq_item { + Array *row; + union { + char *c_str; + double d; + } value; +}; +static int sort_cmp_string(const void *a, const void *b) { + return strcmp( + static_cast(a)->value.c_str, + static_cast(b)->value.c_str + ); } +static int sort_cmp_double(const void *a, const void *b) { + double va=static_cast(a)->value.d; + double vb=static_cast(b)->value.d; + if(vavb) + return +1; + else + return 0; +} +static void _sort(Request& r, const String& method_name, MethodParams *params) { + Value& key_maker=params->get_junction(0, "key-maker must be code"); + + bool reverse=params->size()==2/*..[asc|desc]*/? + reverse=params->get_no_junction(1, "order must not be code").as_string()=="desc": + false; -static void _empty(Request& r, const String&, Array *params) { Table& table=static_cast(r.self)->table(); - if(table.size()==0) { - Value& value=r.process(*static_cast(params->get(0))); - r.write_pass_lang(value); - } else if(params->size()==2) { - Value& value=r.process(*static_cast(params->get(1))); - r.write_pass_lang(value); + + // anything to sort? + if(!table.size()) + return; + + Seq_item *seq=(Seq_item *)malloc(sizeof(Seq_item)*table.size()); + int i; + + // calculate key values + bool key_values_are_strings=true; + for(i=0; i(r.self); + Table& table=vtable.table(); + Value& result=*new(pool) VBool(pool, table.locate( + params->get(0).as_string(), + params->get(1).as_string())); + result.set_name(method_name); + r.write_no_lang(result); +} + +static void _flip(Request& r, const String& method_name, MethodParams *params) { + Pool& pool=r.pool(); + VTable& vtable=*static_cast(r.self); + + Table& old_table=*vtable.get_table(); + Table& new_table=*new(pool) Table(pool, &method_name, 0/*nameless*/); + if(old_table.size()) + if(int old_cols=old_table.at(0).size()) + for(int column=0; columnget_junction(0, "body must be code")).as_string(); + + // parse cells + Array& row=*new(pool) Array(pool); + string.split(row, 0, "\t", 1, String::UL_CLEAN); + + VTable& vtable=*static_cast(r.self); + // disable ^a.menu{^a.append[]} + vtable.lock(); + vtable.table()+=&row; + vtable.unlock(); +} + +static void _join(Request& r, const String& method_name, MethodParams *params) { + Pool& pool=r.pool(); + + Table *maybe_src=params->get_no_junction(0, "table ref must not be code").get_table(); + if(!maybe_src) + PTHROW(0, 0, + &method_name, + "source is not a table"); + + Table& src=*maybe_src; + Table& dest=static_cast(r.self)->table(); + if(&src == &dest) + PTHROW(0, 0, + &method_name, + "source and destination are same table"); + + if(const Array *dest_columns=dest.columns()) { // dest is named + int saved_src_current=src.current(); + for(int src_row=0; src_rowsize(); dest_column++) + dest_row+=src.item(*dest_columns->get_string(dest_column)); + dest+=&dest_row; + } + src.set_current(saved_src_current); + } else { // dest is nameless + for(int src_row=0; src_rowget_junction(0, "statement must be code"); + + ulong limit=0; + if(params->size()>1) { + Value& limit_code=params->get_junction(1, "limit must be expression"); + limit=(uint)r.process(limit_code).as_double(); + } + + ulong offset=0; + if(params->size()>2) { + Value& offset_code=params->get_junction(2, "offset must be expression"); + offset=(ulong)r.process(offset_code).as_double(); + } + + Temp_lang temp_lang(r, String::UL_SQL); + const String& statement_string=r.process(statement).as_string(); + const char *statement_cstr= + statement_string.cstr(String::UL_UNSPECIFIED, r.connection); + unsigned int sql_column_count; SQL_Driver::Cell *sql_columns; + unsigned long sql_row_count; SQL_Driver::Cell **sql_rows; + bool need_rethrow=false; Exception rethrow_me; + PTRY { + r.connection->query( + statement_cstr, offset, limit, + &sql_column_count, &sql_columns, + &sql_row_count, &sql_rows); + } + PCATCH(e) { // connect/process problem + rethrow_me=e; need_rethrow=true; + } + PEND_CATCH + if(need_rethrow) + PTHROW(rethrow_me.type(), rethrow_me.code(), + &statement_string, // setting more specific source [were url] + rethrow_me.comment()); + + Array& table_columns=*new(pool) Array(pool); + for(unsigned int i=0; i(r.self)->set_table(table); +} + +static void _dir(Request& r, const String& method_name, MethodParams *params) { + Pool& pool=r.pool(); + + Value& relative_path=params->get_no_junction(0, "path must not be code"); + + const String *regexp; + pcre *regexp_code; + int ovecsize; + int *ovector; + if(params->size()>1) { + regexp=¶ms->get_no_junction(1, "regexp must not be code").as_string(); + + const char *pattern=regexp->cstr(String::UL_AS_IS); + const char *errptr; + int erroffset; + regexp_code=pcre_compile(pattern, PCRE_EXTRA | PCRE_DOTALL, + &errptr, &erroffset, + r.pcre_tables); + + if(!regexp_code) + PTHROW(0, 0, + ®exp->mid(erroffset, regexp->size()), + "regular expression syntax error - %s", errptr); + + ovector=(int *)malloc(sizeof(int)*(ovecsize=(1/*match*/)*3)); + } else + regexp_code=0; + + + const char* absolute_path_cstr=r.absolute(relative_path.as_string()) + .cstr(String::UL_FILE_NAME); + + Array& columns=*new(pool) Array(pool); + columns+=new(pool) String(pool, "name"); + Table& table=*new(pool) Table(pool, &method_name, &columns); + + LOAD_DIR(absolute_path_cstr, + size_t file_name_size=strlen(ffblk.ff_name); + bool suits=true; + if(regexp_code) { + int exec_result=pcre_exec(regexp_code, 0, + ffblk.ff_name, file_name_size, 0, + 0, ovector, ovecsize); + + if(exec_result==PCRE_ERROR_NOMATCH) + suits=false; + else if(exec_result<0) { + (*pcre_free)(regexp_code); + PTHROW(0, 0, + regexp, + "regular expression execute (%d)", + exec_result); + } + } + + if(suits) { + char *file_name_cstr=(char *)r.malloc(file_name_size); + memcpy(file_name_cstr, ffblk.ff_name, file_name_size); + String &file_name=*new(pool) String(pool); + file_name.APPEND(file_name_cstr, file_name_size, String::UL_FILE_NAME, + method_name.origin().file, method_name.origin().line); + + Array& row=*new(pool) Array(pool); + row+=&file_name; + table+=&row; + } + ); + + if(regexp_code) + (*pcre_free)(regexp_code); + + // replace any previous table value + static_cast(r.self)->set_table(table); } -// initialize +// constructor -void initialize_table_class(Pool& pool, VStateless_class& vclass) { - // ^table.set{data} - // ^table.set[nameless]{data} - vclass.add_native_method("set", _set, 1, 2); +MTable::MTable(Pool& apool) : Methoded(apool) { + set_name(*NEW String(pool(), TABLE_CLASS_NAME)); - // ^table.load[file] - // ^table.load[nameless;file] - vclass.add_native_method("load", _load, 1, 2); + // ^table:set{data} + // ^table:set[nameless]{data} + add_native_method("set", Method::CT_DYNAMIC, _set, 1, 2); + + // ^table:load[file] + // ^table:load[nameless;file] + add_native_method("load", Method::CT_DYNAMIC, _load, 1, 2); // ^table.save[file] // ^table.save[nameless;file] - vclass.add_native_method("save", _save, 1, 2); + add_native_method("save", Method::CT_DYNAMIC, _save, 1, 2); // ^table.count[] - vclass.add_native_method("count", _count, 0, 0); + add_native_method("count", Method::CT_DYNAMIC, _count, 0, 0); // ^table.line[] - vclass.add_native_method("line", _line, 0, 0); + add_native_method("line", Method::CT_DYNAMIC, _line, 0, 0); // ^table.offset[] // ^table.offset[offset] - vclass.add_native_method("offset", _offset, 0, 1); + add_native_method("offset", Method::CT_DYNAMIC, _offset, 0, 1); // ^table.menu{code} // ^table.menu{code}[delim] - vclass.add_native_method("menu", _menu, 1, 2); + add_native_method("menu", Method::CT_DYNAMIC, _menu, 1, 2); // ^table.empty{code-when-empty} // ^table.empty{code-when-empty}{code-when-not} - vclass.add_native_method("empty", _empty, 1, 2); + add_native_method("empty", Method::CT_DYNAMIC, _empty, 1, 2); + + // ^table.record[] + add_native_method("record", Method::CT_DYNAMIC, _record, 0, 0); + + // ^table.sort{string-key-maker} ^table.sort{string-key-maker}[asc|desc] + // ^table.sort(numeric-key-maker) ^table.sort(numeric-key-maker)[asc|desc] + add_native_method("sort", Method::CT_DYNAMIC, _sort, 1, 2); + + // ^table.locate[field;value] + add_native_method("locate", Method::CT_DYNAMIC, _locate, 2, 2); + + // ^table.flip[] + add_native_method("flip", Method::CT_DYNAMIC, _flip, 0, 0); + + // ^table.append{r{tab}e{tab}c{tab}o{tab}r{tab}d} + add_native_method("append", Method::CT_DYNAMIC, _append, 1, 1); + + // ^table.join[table] + add_native_method("join", Method::CT_DYNAMIC, _join, 1, 1); + -} + // ^table:sql[query][(count[;offset])] + add_native_method("sql", Method::CT_DYNAMIC, _sql, 1, 3); + + // ^table:dir[path] + // ^table:dir[path][regexp] + add_native_method("dir", Method::CT_DYNAMIC, _dir, 1, 2); +} + +// global variable + +Methoded *table_class; + +// creator + +Methoded *MTable_create(Pool& pool) { + return table_class=new(pool) MTable(pool); +}