--- parser3/src/classes/table.C 2001/03/12 17:00:46 1.2 +++ parser3/src/classes/table.C 2003/04/08 12:47:30 1.172.2.14.2.26 @@ -1,93 +1,823 @@ -/* - Parser - Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) - Author: Alexander Petrosyan (http://design.ru/paf) +/** @file + Parser: @b table parser class. - $Id: table.C,v 1.2 2001/03/12 17:00:46 paf Exp $ + Copyright (c) 2001-2003 ArtLebedev Group (http://www.artlebedev.com) + Author: Alexandr Petrosian (http://paf.design.ru) */ +static const char* IDENT_TABLE_C="$Date: 2003/04/08 12:47:30 $"; + +#include "classes.h" +#include "pa_vmethod_frame.h" + +#include "pa_common.h" #include "pa_request.h" -#include "_table.h" #include "pa_vtable.h" -#include "pa_common.h" +#include "pa_vint.h" +#include "pa_sql_connection.h" +#include "pa_vbool.h" + +// class + +class MTable: public Methoded { +public: // VStateless_class + Value* create_new_value() { return new VTable(); } + +public: + MTable(); + +public: // Methoded + bool used_directly() { return true; } +}; + +// global variable -// global var +DECLARE_CLASS_VAR(table, new MTable, 0); -VClass *table_class; +// defines for globals + +#define SQL_LIMIT_NAME "limit" +#define SQL_OFFSET_NAME "offset" +#define SQL_DEFAULT_NAME "default" +#define SQL_DISTINCT_NAME "distinct" + +// globals + +String sql_limit_name(SQL_LIMIT_NAME); +String sql_offset_name(SQL_OFFSET_NAME); +String sql_default_name(SQL_DEFAULT_NAME); +String sql_distinct_name(SQL_DISTINCT_NAME); // methods +static void get_copy_options(Request& r, MethodParams& params, size_t param_index, + const Table& source, + int& offset, + int& limit) { + + offset=0; + limit=0; + if(params.count()<=param_index) + return; + + Value& voptions=params.as_no_junction(param_index, "options must be hash, not code"); + if(!voptions.is_string()) { + if(HashStringValue* options=voptions.get_hash()) { + int valid_options=0; + if(Value* voffset=options->get(sql_offset_name)) { + valid_options++; + if(voffset->is_string()) { + const String& soffset=*voffset->get_string(); + if(soffset == "cur") + offset=source.current(); + else + throw Exception("parser.runtime", + &soffset, + "must be 'cur' string or expression"); + } else + offset=r.process_to_value(*voffset).as_int(); + } + if(Value* vlimit=options->get(sql_limit_name)) { + valid_options++; + limit=r.process_to_value(*vlimit).as_int(); + if(!limit) // zero limit = should be 'nothing to copy', for methods zero means 'all' + limit=-1; // thus fixing + } + if(valid_options!=options->count()) + throw Exception("parser.runtime", + 0, + "called with invalid option"); + } else + throw Exception("parser.runtime", + 0, + "options must be hash"); + } +} -// TODO: проверить ^set в ^menu & co +static void _create(Request& r, MethodParams& params) { + // clone/copy part? + if(Table *source=params[0].get_table()) { + int offset, limit; + get_copy_options(r, params, 1, *source, + offset, limit); + GET_SELF(r, VTable).set_table(*new Table(*source, offset, limit)); + return; + } -static void set_or_load( - Request& r, - const String& method_name, Array *params, - bool is_load) { - Pool& pool=r.pool(); // data is last parameter - Value *vdata=static_cast(params->get(params->size()-1)); - if(vdata->get_junction()) - R_THROW(0, 0, - &method_name, - "body must not be a junction"); + Temp_lang temp_lang(r, String::L_PASS_APPENDED); + const String& data= + r.process_to_string(params.as_junction(params.count()-1, "body must be code")); - // data or file_name - char *data_or_filename=vdata->as_string().cstr(); - // data - char *data=is_load?file_read(pool, r.absolute(data_or_filename)):data_or_filename; + // parse columns + size_t raw_pos_after=0; + Table::columns_type columns; + if(params.count()==2) { + columns=Table::columns_type(0); // nameless + } else { + columns=Table::columns_type(new ArrayString); + + ArrayString head; + data.split(head, raw_pos_after, "\n", String::L_AS_IS, 1); + if(head.count()) { + size_t col_pos_after=0; + head[0]->split(*columns, col_pos_after, "\t", String::L_AS_IS); + } + } + + Table& table=*new Table(columns); + // parse cells + + ArrayString rows; + data.split(rows, raw_pos_after, "\n", String::L_AS_IS); + Array_iterator i(rows); + while(i.has_next()) { + Table::element_type row(new ArrayString); + const String& string=*i.next(); + // remove comment lines + if(!string.length()) + continue; + + size_t col_pos_after=0; + string.split(*row, col_pos_after, "\t", String::L_AS_IS); + table+=row; + } + + // replace any previous table value + GET_SELF(r, VTable).set_table(table); +} + +static void _load(Request& r, MethodParams& params) { + const String& first_param=params.as_string(0, "file name must be string"); + int filename_param_index=0; + bool nameless=first_param=="nameless"; + if(nameless) + filename_param_index++; + size_t options_param_index=filename_param_index+1; + + // loading text + char *data=file_read_text(r.charsets.source(), + r.absolute(params.as_string(filename_param_index, "file name must be string")), + true, + options_param_indexsize()==2) { - columns=0; + Table::columns_type columns; + if(nameless) { + columns=Table::columns_type(0); // nameless } else { - columns=new(pool) Array(pool); + columns=Table::columns_type(new ArrayString); - if(char *row_chars=getrow(&data)) + while(char *row_chars=getrow(&data)) { + // remove empty&comment lines + if(!*row_chars || *row_chars == '#') + continue; do { - String *name=new(pool) String(pool); - name->APPEND(lsplit(&row_chars, '\t'), 0, file, line++); - *columns+=name; + *columns+=new String(lsplit(&row_chars, '\t'), 0, true); } while(row_chars); + + break; + } } // parse cells - Table& table=*new(pool) Table(pool, method_name, columns); + Table& table=*new Table(columns); char *row_chars; while(row_chars=getrow(&data)) { - Array *row=new(pool) Array(pool); + // remove empty&comment lines + if(!*row_chars || *row_chars == '#') + continue; + Table::element_type row(new ArrayString); while(char *cell_chars=lsplit(&row_chars, '\t')) { - String *cell=new(pool) String(pool); - cell->APPEND(cell_chars, 0, file, line); - *row+=cell; + *row+=new String(cell_chars, 0, true); } - line++; table+=row; }; // replace any previous table value - r.self->as_vtable().set_table(table); + GET_SELF(r, VTable).set_table(table); +} + +/// @todo "x\nx" "xxx""xx" +static void _save(Request& r, MethodParams& params) { + Value& vfile_name=params.as_no_junction(params.count()-1, "file name must not be code"); + + Table& table=GET_SELF(r, VTable).table(); + + bool do_append=false; + String sdata; + if(params.count()==1) { // named output + // write out names line + if(table.columns()) { // named table + for(Array_iterator i(*table.columns()); i.has_next(); ) { + sdata.append(*i.next(), String::L_TABLE); + if(i.has_next()) + sdata.append_know_length("\t", 1, String::L_CLEAN); + } + } else { // nameless table + if(int lsize=table.count()?table[0]->count():0) + for(int column=0; column i(table); + while(i.has_next()) { + for(Array_iterator c(*i.next()); c.has_next(); ) { + sdata.append(*c.next(), String::L_TABLE); + if(c.has_next()) + sdata.append_know_length("\t", 1, String::L_CLEAN); + } + sdata.append_know_length("\n", 1, String::L_CLEAN); + } + + // write + file_write(r.absolute(vfile_name.as_string()), + sdata.cstr(), sdata.length(), true, do_append); +} + +static void _count(Request& r, MethodParams&) { + int result=GET_SELF(r, VTable).table().count(); + r.write_no_lang(*new VInt(result)); +} + +static void _line(Request& r, MethodParams&) { + int result=1+GET_SELF(r, VTable).table().current(); + r.write_no_lang(*new VInt(result)); +} + +static void _offset(Request& r, MethodParams& params) { + Table& table=GET_SELF(r, VTable).table(); + if(params.count()) { + bool absolute=false; + if(params.count()>1) { + const String& whence=params.as_string(0, "whence must be string"); + if(whence=="cur") + absolute=false; + else if(whence=="set") + absolute=true; + else + throw Exception("parser.runtime", + &whence, + "is invalid whence, valid are 'cur' or 'set'"); + } + + Value& offset_expr=params.as_junction(params.count()-1, "offset must be expression"); + table.offset(absolute, r.process_to_value(offset_expr).as_int()); + } else + r.write_no_lang(*new VInt(table.current())); +} + +static void _menu(Request& r, MethodParams& params) { + Value& body_code=params.as_junction(0, "body must be code"); + + Value* delim_maybe_code=params.count()>1?¶ms[1]:0; + + Table& table=GET_SELF(r, VTable).table(); + bool need_delim=false; + int saved_current=table.current(); + int size=table.count(); + for(int row=0; rowlength()) { // delimiter set and we have body + if(need_delim) // need delim & iteration produced string? + r.write_pass_lang(r.process(*delim_maybe_code)); + need_delim=true; + } + r.write_pass_lang(sv_processed); + } + table.set_current(saved_current); +} + +#ifndef DOXYGEN +struct Row_info { + Request *r; + Table *table; + Value* key_code; + size_t key_field; + Array* value_fields; + HashStringValue* hash; + bool distinct; + size_t row; +}; +#endif +static void table_row_to_hash(Table::element_type row, Row_info *info) { + const String* key; + if(info->key_code) { + info->table->set_current(info->row++); // change context row + StringOrValue sv_processed=info->r->process(*info->key_code); + key=&sv_processed.as_string(); + } else + key=info->key_fieldcount()?row->get(info->key_field):0; + + if(!key) + return; // ignore rows without key [too-short-record_array if-indexed] + + VHash* vhash=new VHash; + HashStringValue& hash=vhash->hash(); + for(Array_iterator i(*info->value_fields); i.has_next(); ) { + size_t value_field=i.next(); + if(value_fieldcount()) + hash.put( + *info->table->columns()->get(value_field), + new VString(*row->get(value_field))); + } + + if(info->hash->put_dont_replace(*key, vhash)) // put. existed? + if(!info->distinct) + throw Exception("parser.runtime", + key, + "duplicate key"); +} +static void _hash(Request& r, MethodParams& params) { + Table& self_table=GET_SELF(r, VTable).table(); + VHash& result=*new VHash; + if(Table::columns_type columns=self_table.columns()) + if(columns->count()>0) { + bool distinct=false; + int param_index=params.count()-1; + if(param_index>0) { + if(HashStringValue* options= + params.as_no_junction(param_index, "param must not be code").get_hash()) { + --param_index; + int valid_options=0; + if(Value* vdistinct=options->get(sql_distinct_name)) { + valid_options++; + distinct=r.process_to_value(*vdistinct).as_bool(); + } + if(valid_options!=options->count()) + throw Exception("parser.runtime", + 0, + "called with invalid option"); + } + } + if(param_index==2) // bad options param type + throw Exception("parser.runtime", + 0, + "options must be hash"); + + Array value_fields; + if(param_index>0) { + Value& value_fields_param=params.as_no_junction(param_index, "value field(s) must not be code"); + if(value_fields_param.is_string()) { + value_fields+=self_table.column_name2index( + *value_fields_param.get_string(), true); + } else if(Table* value_fields_table=value_fields_param.get_table()) { + for(Array_iterator i(*value_fields_table); + i.has_next(); ) { + const String& value_field_name + =*i.next()->get(0); + value_fields + +=self_table.column_name2index(value_field_name, true); + } + } else + throw Exception("parser.runtime", + 0, + "value field(s) must be string or self_table" + ); + } else { // by all columns, including key + for(size_t i=0; icount(); i++) + value_fields+=i; + } + + + { + Row_info info; + info.r=&r; + info.table=&self_table; + Value* key_param=¶ms[0]; + info.key_code=key_param->get_junction()?key_param:0; + info.key_field=info.key_code?-1 + :self_table.column_name2index(key_param->as_string(), true); + info.value_fields=&value_fields; + info.hash=&result.hash(); + info.distinct=distinct; + info.row=0; + + int saved_current=self_table.current(); + self_table.for_each(table_row_to_hash, &info); + self_table.set_current(saved_current); + } + } + r.write_no_lang(result); +} + +#ifndef DOXYGEN +struct Table_seq_item { + ArrayString* row; + union { + const char *c_str; + double d; + } value; +}; +#endif +static int sort_cmp_string(const void *a, const void *b) { + return strcmp( + static_cast(a)->value.c_str, + static_cast(b)->value.c_str + ); +} +static int sort_cmp_double(const void *a, const void *b) { + double va=static_cast(a)->value.d; + double vb=static_cast(b)->value.d; + if(vavb) + return +1; + else + return 0; +} +static void _sort(Request& r, MethodParams& params) { + Value& key_maker=params.as_junction(0, "key-maker must be code"); + + bool reverse=params.count()>1/*..[desc|asc|]*/? + reverse=params.as_no_junction(1, "order must not be code").as_string()=="desc": + false; // default=asc + + Table& old_table=GET_SELF(r, VTable).table(); + Table& new_table=*new Table(old_table.columns()); + + Table_seq_item* seq=new(PointerFreeGC) Table_seq_item[old_table.count()]; + int i; + + // calculate key values + bool key_values_are_strings=true; + int old_count=old_table.count(); + for(i=0; i1) + throw Exception("parser.runtime", + 0, + "locate by expression has only one parameter - expression"); + + Value& expression_code=params.as_junction(0, "must be expression"); + + Table& table=GET_SELF(r, VTable).table(); + int saved_current=table.current(); + int size=table.count(); + for(int row=0; row2) + throw Exception("parser.runtime", + 0, + "locate by name and value has only two parameters - name and value"); + + Table& table=GET_SELF(r, VTable).table(); + return table.locate( + params.as_string(0, "column name must be string"), + params.as_string(1, "value must be string") + ); +} +static void _locate(Request& r, MethodParams& params) { + bool result=params[0].get_junction()? + _locate_expression(r, params) : + _locate_name_value(r, params); + r.write_no_lang(*new VBool(result)); +} + +static void _flip(Request& r, MethodParams& params) { + Table& old_table=GET_SELF(r, VTable).table(); + Table& new_table=*new Table(old_table.columns()); + if(size_t old_count=old_table.count()) + if(size_t old_cols=old_table[0]->count()) + for(size_t column=0; columncount()?old_row->get(column):new String; + } + new_table+=new_row; + } + + r.write_no_lang(*new VTable(&new_table)); +} + +static void _append(Request& r, MethodParams& params) { + // data + Temp_lang temp_lang(r, String::L_PASS_APPENDED); + const String& string=r.process_to_string(params.as_junction(0, "body must be code")); + + // parse cells + Table::element_type row=new ArrayString; + size_t pos_after=0; + string.split(*row, pos_after, "\t", String::L_AS_IS); + + GET_SELF(r, VTable).table()+=row; +} + +static void _join(Request& r, MethodParams& params) { + Table* maybe_src=params.as_no_junction(0, "table ref must not be code").get_table(); + if(!maybe_src) + throw Exception("parser.runtime", + 0, + "source is not a table"); + + Table& src=*maybe_src; + Table& dest=GET_SELF(r, VTable).table(); + if(&src == &dest) + throw Exception("parser.runtime", + 0, + "source and destination are same table"); + + int offset, limit; + get_copy_options(r, params, 1, src, + offset, limit); + + if(Table::columns_type dest_columns=dest.columns()) { // dest is named + int saved_src_current=src.current(); + int m=src.count()-offset; + if(!limit || limit>m) + limit=m; + int end=offset+limit; + for(int src_row=offset; src_rowcount(); dest_column++) { + const String* src_item=src.item(*dest_columns->get(dest_column)); + *dest_row+=src_item?src_item:new String; + } + dest+=dest_row; + } + src.set_current(saved_src_current); + } else { // dest is nameless + size_t src_count=src.count(); + for(size_t src_row=0; src_row1) { + Value& voptions=params.as_no_junction(1, "options must be hash, not code"); + if(!voptions.is_string()) + if(HashStringValue* options=voptions.get_hash()) { + int valid_options=0; + if(Value* vlimit=options->get(sql_limit_name)) { + valid_options++; + limit=(ulong)r.process_to_value(*vlimit).as_double(); + } + if(Value* voffset=options->get(sql_offset_name)) { + valid_options++; + offset=(ulong)r.process_to_value(*voffset).as_double(); + } + if(valid_options!=options->count()) + throw Exception("parser.runtime", + 0, + "called with invalid option"); + } else + throw Exception("parser.runtime", + 0, + "options must be hash"); + } + + Temp_lang temp_lang(r, String::L_SQL); + const String& statement_string=r.process_to_string(statement); + const char* statement_cstr= + statement_string.cstr(String::L_UNSPECIFIED, r.connection()); + Table_sql_event_handlers handlers; +#ifdef RESOURCES_DEBUG + struct timeval mt[2]; + //measure:before + gettimeofday(&mt[0],NULL); +#endif + r.connection()->query( + statement_cstr, offset, limit, + handlers, + statement_string); + +#ifdef RESOURCES_DEBUG + //measure:after connect + gettimeofday(&mt[1],NULL); + + double t[2]; + for(int i=0;i<2;i++) + t[i]=mt[i].tv_sec+mt[i].tv_usec/1000000.0; + + r.sql_request_time+=t[1]-t[0]; +#endif + + Table& result= + handlers.table?*handlers.table: // query resulted in table? return it + *new Table(Table::columns_type(0)); // query returned no table, fake it + + // replace any previous table value + GET_SELF(r, VTable).set_table(result); } +static void _columns(Request& r, MethodParams&) { -static void _set(Request& r, const String& method_name, Array *params) { - set_or_load(r, method_name, params, false); + Table::columns_type result_columns(new ArrayString); + *result_columns+=new String("column"); + Table& result_table=*new Table(result_columns); + + Table& source_table=GET_SELF(r, VTable).table(); + if(Table::columns_type source_columns=source_table.columns()) { + for(Array_iterator i(*source_columns); i.has_next(); ) { + Table::element_type result_row(new ArrayString); + *result_row+=i.next(); + result_table+=result_row; + } + } + + r.write_no_lang(*new VTable(&result_table)); } -static void _load(Request& r, const String& method_name, Array *params) { - set_or_load(r, method_name, params, true); +static void _select(Request& r, MethodParams& params) { + Value& vcondition=params.as_junction(0, "condition must be expression"); + + Table& source_table=GET_SELF(r, VTable).table(); + Table& result_table=*new Table(source_table.columns()); + + int saved_current=source_table.current(); + int size=source_table.count(); + for(int row=0; row