File:
[parser3project] /
parser3 /
src /
classes /
string.C
Revision
1.119:
download - view:
text,
annotated -
select for diffs -
revision graph
Thu Aug 29 12:22:46 2002 UTC (23 years, 9 months ago) by
paf
Branches:
MAIN
CVS tags:
HEAD
junction_cleaner moved to auto VMethodFrame [called less frequent, allowed to remove ugly Junction.change_context-s from many places, switch, mail:send..html{}, ..]
request.root renamed to method_frame [more easyreading]
ancient {...PUSH/POPs...} changed to stack vars [speed up]
/** @file
Parser: @b string parser class.
Copyright (c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com)
Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru)
*/
static const char* IDENT_STRING_C="$Date: 2002/08/29 12:22:46 $";
#include "classes.h"
#include "pa_request.h"
#include "pa_vdouble.h"
#include "pa_vint.h"
#include "pa_vtable.h"
#include "pa_vbool.h"
#include "pa_string.h"
#include "pa_sql_connection.h"
#include "pa_dictionary.h"
#include "pa_vmethod_frame.h"
// class
/// Methoded descendant holding the native methods of the Parser @b string class.
class MString : public Methoded {
public:
	/// Registers all native string methods (see the constructor body).
	MString(Pool& pool);

	// Methoded
	/// Always answers true for this class.
	bool used_directly() { return true; }
};
// methods
/// ^string.length[] -- writes the size of the self string, wrapped into a VDouble.
static void _length(Request& r, const String& method_name, MethodParams *) {
	Pool& pool=r.pool();
	const double length=r.self->get_string()->size();
	VDouble& vlength=*new(pool) VDouble(pool, length);
	r.write_no_lang(vlength);
}
/**
	^string.int[] / ^string.int(default)

	Writes self converted to int as a VInt.
	When the conversion throws and a default was passed, the default code is
	processed and its int value is written instead; without a default the
	original exception is rethrown.
*/
static void _int(Request& r, const String& method_name, MethodParams *params) {
	Pool& pool=r.pool();
	// optional fallback code; it is only evaluated when the conversion fails
	Value *default_code=params->size()>0?
		&params->as_junction(0, "default must be int"):0; // (default)

	int converted;
	try {
		converted=r.self->as_int();
	} catch(...) { // convert problem
		if(!default_code) // we have a problem when no default
			/*re*/throw;
		converted=r.process_to_value(*default_code).as_int();
	}
	r.write_no_lang(*new(pool) VInt(pool, converted));
}
/**
	^string.double[] / ^string.double(default)

	Writes self converted to double as a VDouble.
	When the conversion throws and a default was passed, the default code is
	processed and its double value is written instead; without a default the
	original exception is rethrown.
*/
static void _double(Request& r, const String& method_name, MethodParams *params) {
	Pool& pool=r.pool();
	// optional fallback code; it is only evaluated when the conversion fails
	Value *default_code=params->size()>0?
		&params->as_junction(0, "default must be double"):0; // (default)

	double converted;
	try {
		converted=r.self->as_double();
	} catch(...) { // convert problem
		if(!default_code) // we have a problem when no default
			/*re*/throw;
		converted=r.process_to_value(*default_code).as_double();
	}
	r.write_no_lang(*new(pool) VDouble(pool, converted));
}
/**
	^string.format{format}

	Formats self (taken as double) with the given format and writes the result.
	Deliberately not static.
*/
/*not static*/void _string_format(Request& r, const String& method_name, MethodParams *params) {
	Pool& pool=r.pool();

	// the format may be passed as code (historical {} syntax), so it is processed to a string first
	const String& format_string=r.process_to_string(params->get(0));

	char *formatted=format(pool, r.self->as_double(), format_string.cstr());

	// the formatted text is appended as clean, with the origin of the method name
	String formatted_string(pool);
	formatted_string.APPEND_CLEAN(formatted, 0,
		method_name.origin().file,
		method_name.origin().line);
	r.write_no_lang(formatted_string);
}
/**
	^string.left(n) -- writes the first @a n characters of self.

	A negative @a n is treated as 0, the same way _mid clamps its arguments;
	previously it was cast straight to size_t and turned into a huge count.
*/
static void _left(Request& r, const String&, MethodParams *params) {
	const int requested=params->as_int(0, "n must be int", r);
	// clamp before the unsigned conversion so negative values cannot wrap around
	const size_t n=requested>0?(size_t)requested:0;

	const String& string=static_cast<VString *>(r.self)->string();
	r.write_assign_lang(string.mid(0, n));
}
/**
	^string.right(n) -- writes the last @a n characters of self.

	@a n is clamped to [0, string size]: a negative value yields an empty
	piece and a value above the size yields the whole string.
	Without the clamp `size-n` is computed in unsigned arithmetic and wraps
	around to a start position far beyond the end of the string.
*/
static void _right(Request& r, const String&, MethodParams *params) {
	const int requested=params->as_int(0, "n must be int", r);

	const String& string=static_cast<VString *>(r.self)->string();
	const size_t length=string.size();

	// clamp before subtracting so that length-n can never underflow
	size_t n=requested>0?(size_t)requested:0;
	if(n>length)
		n=length;

	r.write_assign_lang(string.mid(length-n, length));
}
/**
	^string.mid(p;n) -- writes the piece of self from position @a p, @a n long.

	Negative @a p and @a n are raised to 0.
	When @a n is omitted, the string size is used as the count.
*/
static void _mid(Request& r, const String&, MethodParams *params) {
	const String& self_string=*r.self->get_string();

	const size_t begin=(size_t)max(0, params->as_int(0, "p must be int", r));

	size_t count;
	if(params->size()>1)
		count=(size_t)max(0, params->as_int(1, "n must be int", r));
	else
		count=self_string.size();

	r.write_assign_lang(self_string.mid(begin, begin+count));
}
/// ^string.pos[substr] -- writes, as a VInt, what String::pos reports for @a substr in self.
static void _pos(Request& r, const String& method_name, MethodParams *params) {
	Pool& pool=r.pool();

	Value& vneedle=params->as_no_junction(0, "substr must not be code");
	const String& haystack=static_cast<VString *>(r.self)->string();

	VInt& vposition=*new(pool) VInt(pool, haystack.pos(vneedle.as_string()));
	r.write_assign_lang(vposition);
}
/**
	Splits @a string into @a result, using the delimiter found in
	parameter number @a paramIndex (which must not be code).
*/
static void split_list(Request& r, const String& method_name,
					   MethodParams *params, int paramIndex,
					   const String& string,
					   Array& result) {
	Value& vdelimiter=
		params->as_no_junction(paramIndex, "delimiter must not be code");
	const String& delimiter=vdelimiter.as_string();
	string.split(result, 0, delimiter);
}
// Bit flags selecting the layout of a split result; each flag has its own hex digit (0xVHRL).
// split_options treats LEFT/RIGHT and HORIZONTAL/VERTICAL as conflicting pairs.
// split_with_options only tests RIGHT (pieces in reverse order) and
// HORIZONTAL (all pieces in one row); the other two act as the defaults.
#define SPLIT_LEFT 0x0001
#define SPLIT_RIGHT 0x0010
#define SPLIT_HORIZONTAL 0x0100
#define SPLIT_VERTICAL 0x1000
/**
	Translates the option letters found in @a options into SPLIT_xxx bits.

	Each letter is recognized in lower and upper case.
	@return OR-ed bits, 0 when @a options is null or contains no known letter
	@throws Exception "parser.runtime" when two conflicting letters are present
*/
static int split_options(const String *options) {
	struct Split_option {
		const char *keyL;
		const char *keyU;
		int setBit;
		int checkBit;
	} known_options[]={
		{"l", "L", SPLIT_LEFT, SPLIT_RIGHT}, // 0xVHRL
		{"r", "R", SPLIT_RIGHT, SPLIT_LEFT},
		{"h", "H", SPLIT_HORIZONTAL, SPLIT_VERTICAL},
		{"v", "V", SPLIT_VERTICAL, SPLIT_HORIZONTAL},
		{0} // terminator
	};

	if(!options)
		return 0;

	int bits=0;
	for(Split_option *option=known_options; option->keyL; option++) {
		const bool mentioned=
			options->pos(option->keyL)>=0
			|| (option->keyU && options->pos(option->keyU)>=0);
		if(!mentioned)
			continue;

		// the opposite option of the same pair was already seen
		if(bits & option->checkBit)
			throw Exception("parser.runtime",
				options,
				"conflicting split options");

		bits |= option->setBit;
	}
	return bits;
}
/**
	Builds a table with the single column "piece" and one row per piece.

	@param right when true, the pieces are stored in reverse order
*/
static Table *split_vertical(Request& r, const String& string, Array& pieces, bool right) {
	Pool& pool=r.pool();

	Array& columns=*new(pool) Array(pool);
	columns+=new(pool) String(pool, "piece");

	Table& table=*new(pool) Table(pool, &string,
		&columns, pieces.size());

	if(!right) { // left: pieces in their original order
		for(Array_iter i(pieces); i.has_next(); ) {
			Array& row=*new(pool) Array(pool);
			row+=i.next();
			table+=&row;
		}
		return &table;
	}

	// right: walk the pieces from the last one to the first
	int index=pieces.size();
	while(--index>=0) {
		Array& row=*new(pool) Array(pool);
		row+=pieces.get(index);
		table+=&row;
	}
	return &table;
}
/**
	Builds a nameless table consisting of one row that holds all the pieces.

	@param right when true, the pieces are stored in reverse order
*/
static Table *split_horizontal(Request& r, const String& string, Array& pieces, bool right) {
	Pool& pool=r.pool();

	Table& table=*new(pool) Table(pool, &string, 0 /* nameless */);
	Array& single_row=*new(pool) Array(pool);

	if(!right) { // left: pieces in their original order
		for(Array_iter i(pieces); i.has_next(); )
			single_row+=i.next();
	} else { // right: from the last piece to the first
		int index=pieces.size();
		while(--index>=0)
			single_row+=pieces.get(index);
	}

	table+=&single_row;
	return &table;
}
/**
	Common body of ^string.split, ^string.lsplit and ^string.rsplit.

	Splits self by the delimiter in param #0 and writes the pieces as a VTable.

	@param bits SPLIT_xxx flags; when 0, the flags are determined from
		the optional param #1 by split_options
*/
static void split_with_options(Request& r, const String& method_name, MethodParams *params,
							   int bits) {
	Pool& pool=r.pool();
	const String& string=*r.self->get_string();

	Array pieces(pool);
	split_list(r, method_name, params, 0,
		string, pieces);

	if(!bits) {
		const String *options=0;
		if(params->size()>1)
			options=&params->as_string(1, "options must not be code");
		bits=split_options(options);
	}

	bool right=(bits & SPLIT_RIGHT) != 0;
	bool horizontal=(bits & SPLIT_HORIZONTAL) !=0;

	Table *table;
	if(horizontal)
		table=split_horizontal(r, string, pieces, right);
	else
		table=split_vertical(r, string, pieces, right);

	r.write_no_lang(*new(pool) VTable(pool, table));
}
/// ^string.split[delim] / ^string.split[delim][options]
static void _split(Request& r, const String& method_name, MethodParams *params) {
	const int bits_from_params=0; // maybe-determine from param #2
	split_with_options(r, method_name, params, bits_from_params);
}
/// ^string.lsplit[delim] -- split with the SPLIT_LEFT flag forced.
static void _lsplit(Request& r, const String& method_name, MethodParams *params) {
	const int forced_bits=SPLIT_LEFT;
	split_with_options(r, method_name, params, forced_bits);
}
/// ^string.rsplit[delim] -- split with the SPLIT_RIGHT flag forced.
static void _rsplit(Request& r, const String& method_name, MethodParams *params) {
	const int forced_bits=SPLIT_RIGHT;
	split_with_options(r, method_name, params, forced_bits);
}
/// Match callback used for searching: appends every non-null @a row to @a table.
static void search_action(Table& table, Array *row, int, int, int, int, void *) {
	if(!row)
		return;
	table+=row;
}
#ifndef DOXYGEN
/// Context handed to replace_action through its void* parameter.
/// Member order matters: the struct is filled with a positional initializer.
struct Replace_action_info {
	Request *request; ///< used to process the replacement code
	const String *origin;
	const String *src; ///< string being matched
	String *dest; ///< receives the resulting string
	VTable *vtable; ///< gets the current match table before the replacement code runs
	Value *replacement_code;
};
#endif
/**
	Match callback used for replacing.

	With a non-null @a row (a match): copies the source piece between the
	previous match and this one to the destination, stores the row as the only
	record of @a table, and appends the processed replacement code.
	With a null @a row (the end): copies the source piece [poststart, postfinish).

	@param info points to Replace_action_info

	@todo they can do $global[$result] there, getting pointer to later-invalid local var, kill this
*/
static void replace_action(Table& table, Array *row,
						   int prestart, int prefinish,
						   int poststart, int postfinish,
						   void *info) {
	Replace_action_info *context=static_cast<Replace_action_info *>(info);
	String& dest=*context->dest;

	if(!row) { // end
		dest << context->src->mid(poststart, postfinish);
		return;
	}

	// begin&middle
	// piece from last match['prestart'] to beginning of this match['prefinish']
	if(prestart!=prefinish)
		dest << context->src->mid(prestart, prefinish);

	// store found parts in one-record VTable
	if(table.size()) // middle
		table.put(0, row);
	else // begin
		table+=row;

	// execute 'replacement_code' in 'table' context
	context->vtable->set_table(table);
	dest << context->request->process_to_string(*context->replacement_code);
}
/**
	^string.match[regexp][options] -- search
	^string.match[regexp][options]{replacement-code} -- replace

	Search (fewer than 3 params): writes the table of matches when it has
	more than the 3 pre/match/post columns or the search was global,
	otherwise writes a bool telling whether self matched.

	Replace (3 params): writes self with every match substituted by the
	processed replacement code; while that code runs, the current match is
	available in the junction's method frame under *match_var_name.

	@todo use pcre:study somehow
*/
static void _match(Request& r, const String& method_name, MethodParams *params) {
	Pool& pool=r.pool();
	Value& regexp=params->as_no_junction(0, "regexp must not be code");
	const String *options=
		params->size()>1?
		&params->as_no_junction(1, "options must not be code").as_string():0;

	Temp_lang temp_lang(r, String::UL_PASS_APPENDED);
	Table *table;
	if(params->size()<3) { // search
		const String& src=static_cast<VString *>(r.self)->string();

		bool was_global;
		bool matched=src.match(
			&method_name,
			regexp.as_string(), options,
			&table,
			search_action, 0,
			&was_global);

		Value *result;
		// matched
		// not (just matched[3=pre/match/post], no substrings) or Global search
		if(table->columns()->size()>3 || was_global)
			result=new(pool) VTable(pool, table/*TODO: clone this when table would be stacked!*/); // table of pre/match/post+substrings
		else
			result=new(pool) VBool(pool, matched);
		r.write_assign_lang(*result);
	} else { // replace
		const String& src=*r.self->get_string();
		Value& replacement_code=params->as_junction(2, "replacement param must be code");

		String& result=*new(pool) String(pool);
		VTable vtable(pool);
		Replace_action_info replace_action_info={
			&r, &method_name,
			&src, &result,
			&vtable,
			&replacement_code
		};

		// must stay alive for the whole src.match call below
		Temp_value_element temp_match_var(
			*replacement_code.get_junction()->method_frame,
			*match_var_name, &vtable);

		src.match(
			&method_name,
			r.process_to_string(regexp), options,
			&table,
			replace_action, &replace_action_info);
		r.write_assign_lang(result);
	}
}
/// Common body of ^string.upper and ^string.lower: writes self with its case changed per @a kind.
static void change_case(Request& r, const String& method_name, MethodParams *params,
						String::Change_case_kind kind) {
	const String& original=static_cast<VString *>(r.self)->string();
	r.write_assign_lang(original.change_case(r.pool(), kind));
}
/// ^string.upper[] -- change_case with String::CC_UPPER.
static void _upper(Request& r, const String& method_name, MethodParams *params) {
	const String::Change_case_kind kind=String::CC_UPPER;
	change_case(r, method_name, params, kind);
}
/// ^string.lower[] -- change_case with String::CC_LOWER.
static void _lower(Request& r, const String& method_name, MethodParams *params) {
	const String::Change_case_kind kind=String::CC_LOWER;
	change_case(r, method_name, params, kind);
}
#ifndef DOXYGEN
/**
	SQL query event handlers that collect a single-cell result into a String.

	A second column or a second cell is reported as a "parser.runtime" Exception.
	After the query, @c got_cell tells whether any cell arrived and
	@c result holds its value (appended as tainted).
*/
class String_sql_event_handlers : public SQL_Driver_query_event_handlers {
public:
	String_sql_event_handlers(Pool& apool,
		const String& astatement_string, const char *astatement_cstr) :
		pool(apool),
		statement_string(astatement_string),
		statement_cstr(astatement_cstr),
		got_column(false),
		got_cell(false),
		result(new(apool) String(apool)) {
	}

	/// Accepts the first column only.
	void add_column(void * /*ptr*/, size_t /*size*/) {
		if(got_column)
			throw Exception("parser.runtime",
				&statement_string,
				"result must contain exactly one column");
		got_column=true;
	}

	void before_rows() { /* ignore */ }

	void add_row() { /* ignore */ }

	/// Accepts the first cell only and appends its bytes to the result.
	void add_row_cell(void *ptr, size_t size) {
		if(got_cell)
			throw Exception("parser.runtime",
				&statement_string,
				"result must not contain more then one row");
		got_cell=true;
		result->APPEND_TAINTED((const char *)ptr, size, statement_cstr, 0);
	}

private:
	Pool& pool;
	const String& statement_string;
	const char *statement_cstr;
	bool got_column;

public:
	bool got_cell;
	String *result;
};
#endif
/**
	Runs the SQL statement given in param #0 (must be code) and returns its
	single-cell result.

	Param #1, when present and not a string, must be a hash; its entries
	looked up by *sql_limit_name, *sql_offset_name and *sql_default_name
	are honoured.

	@param options [out] the options hash, or 0 when none was parsed
	@param default_code [out] the code of the default option, or 0 when absent
	@return the result string, or 0 when the query produced no cell
		(the caller is expected to fall back to @a default_code)
	@throws Exception "parser.runtime" when options is not a hash or the
		default option is not code
*/
const String* sql_result_string(Request& r, const String& method_name, MethodParams *params,
								Hash *& options, Value *& default_code) {
	Pool& pool=r.pool();

	Value& statement=params->as_junction(0, "statement must be code");

	// give both out-params a defined value on every path; before, `options`
	// stayed uninitialized when param #1 was present but was a string
	options=0;
	default_code=0;

	ulong limit=0;
	ulong offset=0;
	if(params->size()>1) {
		Value& voptions=params->as_no_junction(1, "options must be hash, not code");
		if(!voptions.is_string()) { // string values are not parsed as options
			options=voptions.get_hash(&method_name);
			if(!options)
				throw Exception("parser.runtime",
					&method_name,
					"options must be hash");

			if(Value *vlimit=(Value *)options->get(*sql_limit_name))
				limit=(ulong)r.process_to_value(*vlimit).as_double();
			if(Value *voffset=(Value *)options->get(*sql_offset_name))
				offset=(ulong)r.process_to_value(*voffset).as_double();

			default_code=(Value *)options->get(*sql_default_name);
			if(default_code && !default_code->get_junction())
				throw Exception("parser.runtime",
					&method_name,
					"default option must be code");
		}
	}

	// the statement text is produced in SQL language context
	Temp_lang temp_lang(r, String::UL_SQL);
	const String& statement_string=r.process_to_string(statement);
	const char *statement_cstr=
		statement_string.cstr(String::UL_UNSPECIFIED, r.connection(&method_name));

	String_sql_event_handlers handlers(pool, statement_string, statement_cstr);
	r.connection(&method_name)->query(
		statement_cstr, offset, limit,
		handlers,
		statement_string);

	if(!handlers.got_cell)
		return 0; // no lines, caller should return second param[default value]

	return handlers.result;
}
/**
	^sql[query] / ^sql[query][$.limit(1) $.offset(2) $.default[n/a]]

	Writes the single-cell result of the query.
	When the query produced no cell, the processed default option is written
	instead; without a default option an exception is thrown.
*/
static void _sql(Request& r, const String& method_name, MethodParams *params) {
	// initialized so they never hold indeterminate values, whatever the callee does
	Hash *options=0;
	Value *default_code=0;

	const String *string=sql_result_string(r, method_name, params, options, default_code);
	if(!string) {
		if(!default_code)
			throw Exception("parser.runtime",
				&method_name,
				"produced no result, but no default option specified");

		// process_to_string yields a reference, so its address is never null
		string=&r.process_to_string(*default_code);
	}
	r.write_assign_lang(*string);
}
/**
	^string.replace[table]

	Builds a Dictionary from the table in param #0 and writes self with the
	dictionary replacements applied.
	@throws Exception "parser.runtime" when the parameter is not a table
*/
static void _replace(Request& r, const String& method_name, MethodParams *params) {
	Pool& pool=r.pool();
	const String& source=*r.self->get_string();

	Value& vreplacements=params->as_no_junction(0, "parameter must not be code");
	Table *replacements=vreplacements.get_table();
	if(!replacements)
		throw Exception("parser.runtime",
			&method_name,
			"parameter must be table");

	Dictionary dictionary(*replacements);
	r.write_assign_lang(source.replace(pool, dictionary));
}
/**
	^string.save[file] / ^string.save[append;file]

	Writes self to the file named by the last parameter.
	With two parameters the first one is the mode, which must be 'append'.
	@throws Exception "parser.runtime" on any other mode
*/
static void _save(Request& r, const String& method_name, MethodParams *params) {
	// the file name is always the last parameter
	const String& file_name=params->as_string(params->size()-1,
		"file name must be string");

	const String& src=static_cast<VString *>(r.self)->string();

	// a mode, when given, can only be 'append'
	const bool do_append=params->size()>1;
	if(do_append) {
		const String& mode=params->as_string(0, "mode must be string");
		if(!(mode=="append"))
			throw Exception("parser.runtime",
				&mode,
				"unknown mode, must be 'append'");
	}

	// write
	const char *text=src.cstr(String::UL_UNSPECIFIED);
	file_write(r.absolute(file_name),
		text, strlen(text), true, do_append);
}
/// ^string.normalize[] -- writes the result of join_chains applied to the self string.
static void _normalize(Request& r, const String& method_name, MethodParams * /*params*/) {
	const String *self_string=r.self->get_string();
	r.write_assign_lang(self_string->join_chains(r.pool(), 0/*cstr*/));
}
// constructor
// Registers every native method of the "string" class.
// NOTE(review): the two trailing numbers of add_native_method look like the
// minimum and maximum parameter counts -- confirm against Methoded.
MString::MString(Pool& apool) : Methoded(apool, "string") {
// ^string.length[]
add_native_method("length", Method::CT_DYNAMIC, _length, 0, 0);
// ^string.int[]
// ^string.int(default)
add_native_method("int", Method::CT_DYNAMIC, _int, 0, 1);
// ^string.double[]
// ^string.double(default)
add_native_method("double", Method::CT_DYNAMIC, _double, 0, 1);
// ^string.format{format}
add_native_method("format", Method::CT_DYNAMIC, _string_format, 1, 1);
// ^string.left(n)
add_native_method("left", Method::CT_DYNAMIC, _left, 1, 1);
// ^string.right(n)
add_native_method("right", Method::CT_DYNAMIC, _right, 1, 1);
// ^string.mid(p;n)
add_native_method("mid", Method::CT_DYNAMIC, _mid, 1, 2);
// ^string.pos[substr]
add_native_method("pos", Method::CT_DYNAMIC, _pos, 1, 1);
// ^string.split[delim]
// ^string.split[delim][options]
add_native_method("split", Method::CT_DYNAMIC, _split, 1, 2);
// old names for backward compatibility
// ^string.lsplit[delim]
add_native_method("lsplit", Method::CT_DYNAMIC, _lsplit, 1, 1);
// ^string.rsplit[delim]
add_native_method("rsplit", Method::CT_DYNAMIC, _rsplit, 1, 1);
// ^string.match[regexp][options]
// ^string.match[regexp][options]{replacement-code}
add_native_method("match", Method::CT_DYNAMIC, _match, 1, 3);
// ^string.upper[]
add_native_method("upper", Method::CT_DYNAMIC, _upper, 0, 0);
// ^string.lower[]
add_native_method("lower", Method::CT_DYNAMIC, _lower, 0, 0);
// the only static method here; the query must be code
// ^sql[query]
// ^sql[query][$.limit(1) $.offset(2) $.default[n/a]]
add_native_method("sql", Method::CT_STATIC, _sql, 1, 2);
// ^string.replace[table]
add_native_method("replace", Method::CT_DYNAMIC, _replace, 1, 1);
// ^string.save[file]
// ^string.save[append;file]
add_native_method("save", Method::CT_DYNAMIC, _save, 1, 2);
// ^string.normalize[]
add_native_method("normalize", Method::CT_DYNAMIC, _normalize, 0, 0);
}
// global variable
Methoded *string_class;
// creator
/// Creates the MString instance in @a pool, remembers it in the global string_class and returns it.
Methoded *MString_create(Pool& pool) {
	MString *created=new(pool) MString(pool);
	string_class=created;
	return string_class;
}
E-mail: