/** @file
Parser: @b string parser class.
Copyright (c) 2001-2004 ArtLebedev Group (http://www.artlebedev.com)
Author: Alexandr Petrosian <paf@design.ru> (http://paf.design.ru)
*/
static const char * const IDENT_STRING_C="$Date: 2004/03/01 08:54:16 $";
#include "classes.h"
#include "pa_vmethod_frame.h"
#include "pa_request.h"
#include "pa_vdouble.h"
#include "pa_vint.h"
#include "pa_vtable.h"
#include "pa_vbool.h"
#include "pa_string.h"
#include "pa_sql_connection.h"
#include "pa_dictionary.h"
#include "pa_vmethod_frame.h"
// class
class MString: public Methoded {
public:
MString();
public: // Methoded
bool used_directly() { return true; }
};
// global variable
DECLARE_CLASS_VAR(string, new MString, 0);
// defines for statics
#define MATCH_VAR_NAME "match"
#define TRIM_START_OPTION "start"
#define TRIM_BOTH_OPTION "both"
#define TRIM_END_OPTION "end"
// statics
static const String match_var_name(MATCH_VAR_NAME);
// methods
static void _length(Request& r, MethodParams&) {
double result=GET_SELF(r, VString).string().length();
r.write_no_lang(*new VDouble(result));
}
static void _int(Request& r, MethodParams& params) {
const String& self_string=GET_SELF(r, VString).string();
int converted;
Value* default_code=params.count()>0?¶ms.as_junction(0, "default must be int")
:0; // (default)
try {
if(self_string.is_empty())
throw Exception("parser.runtime",
0,
"parameter is empty string, error converting");
converted=self_string.as_int();
} catch(...) { // convert problem
if(default_code)
converted=r.process_to_value(*default_code).as_int();
else
rethrow; // we have a problem when no default
}
r.write_no_lang(*new VInt(converted));
}
static void _double(Request& r, MethodParams& params) {
const String& self_string=GET_SELF(r, VString).string();
double converted;
Value* default_code=params.count()>0?¶ms.as_junction(0, "default must be double")
:0; // (default)
try {
if(self_string.is_empty())
throw Exception("parser.runtime",
0,
"parameter is empty string, error converting");
converted=self_string.as_double();
} catch(...) { // convert problem
if(default_code)
converted=r.process_to_value(*default_code).as_double();
else
rethrow; // we have a problem when no default
}
r.write_no_lang(*new VDouble(converted));
}
/*not static*/void _string_format(Request& r, MethodParams& params) {
Value& fmt_maybe_code=params[0];
// for some time due to stupid {} in original design
const String& fmt=r.process_to_string(fmt_maybe_code);
const char* buf=format(r.get_self().as_double(), fmt.cstrm());
r.write_no_lang(String(buf));
}
static void _left(Request& r, MethodParams& params) {
size_t n=(size_t)params.as_int(0, "n must be int", r);
const String& string=GET_SELF(r, VString).string();
r.write_assign_lang(string.mid(0, n));
}
static void _right(Request& r, MethodParams& params) {
size_t n=(size_t)params.as_int(0, "n must be int", r);
const String& string=GET_SELF(r, VString).string();
size_t length=string.length();
r.write_assign_lang(n<length?string.mid(length-n, string.length()):string);
}
static void _mid(Request& r, MethodParams& params) {
const String& string=GET_SELF(r, VString).string();
size_t p=(size_t)max(0, params.as_int(0, "p must be int", r));
size_t n=params.count()>1?
(size_t)max(0, params.as_int(1, "n must be int", r)):string.length();
r.write_assign_lang(string.mid(p, p+n));
}
static void _pos(Request& r, MethodParams& params) {
Value& substr=params.as_no_junction(0, "substr must not be code");
const String& string=GET_SELF(r, VString).string();
r.write_assign_lang(*new VInt((int)string.pos(substr.as_string())));
}
static void split_list(MethodParams& params, int paramIndex,
const String& string,
ArrayString& result) {
Value& delim_value=params.as_no_junction(paramIndex, "delimiter must not be code");
size_t pos_after=0;
string.split(result, pos_after, delim_value.as_string());
}
#define SPLIT_LEFT 0x0001
#define SPLIT_RIGHT 0x0010
#define SPLIT_HORIZONTAL 0x0100
#define SPLIT_VERTICAL 0x1000
static int split_options(const String* options) {
struct Split_option {
const char* keyL;
const char* keyU;
int setBit;
int checkBit;
} split_option[]={
{"l", "L", SPLIT_LEFT, SPLIT_RIGHT}, // 0xVHRL
{"r", "R", SPLIT_RIGHT, SPLIT_LEFT},
{"h", "H", SPLIT_HORIZONTAL, SPLIT_VERTICAL},
{"v", "V", SPLIT_VERTICAL, SPLIT_HORIZONTAL},
{0, 0, 0, 0}
};
int result=0;
if(options) {
for(Split_option *o=split_option; o->keyL; o++)
if(options->pos(o->keyL)!=STRING_NOT_FOUND
|| (o->keyU && options->pos(o->keyU)!=STRING_NOT_FOUND)) {
if(result & o->checkBit)
throw Exception("parser.runtime",
options,
"conflicting split options");
result |= o->setBit;
}
}
return result;
}
static Table& split_vertical(ArrayString& pieces, bool right) {
Table::columns_type columns(new ArrayString);
*columns+=new String("piece");
Table& table=*new Table(columns, pieces.count());
if(right) { // right
for(int i=pieces.count(); --i>=0; ) {
Table::element_type row(new ArrayString);
*row+=pieces[i];
table+=row;
}
} else { // left
Array_iterator<const String*> i(pieces);
while(i.has_next()) {
Table::element_type row(new ArrayString);
*row+=i.next();
table+=row;
}
}
return table;
}
static Table& split_horizontal(ArrayString& pieces, bool right) {
Table& table=*new Table(Table::columns_type(0) /* nameless */);
Table::element_type row(new ArrayString(pieces.count()));
if(right) { // right
for(int i=pieces.count(); --i>=0; )
*row+=pieces[i];
} else { // left
for(Array_iterator<const String*> i(pieces); i.has_next(); )
*row+=i.next();
}
table+=row;
return table;
}
static void split_with_options(Request& r, MethodParams& params,
int bits) {
const String& string=GET_SELF(r, VString).string();
ArrayString pieces;
split_list(params, 0, string, pieces);
if(!bits) {
const String* options=0;
if(params.count()>1)
options=¶ms.as_string(1, "options must not be code");
bits=split_options(options);
}
bool right=(bits & SPLIT_RIGHT) != 0;
bool horizontal=(bits & SPLIT_HORIZONTAL) !=0;
Table& table=horizontal?split_horizontal(pieces, right)
:split_vertical(pieces, right);
r.write_no_lang(*new VTable(&table));
}
static void _split(Request& r, MethodParams& params) {
split_with_options(r, params, 0 /* maybe-determine from param #2 */);
}
static void _lsplit(Request& r, MethodParams& params) {
split_with_options(r, params, SPLIT_LEFT);
}
static void _rsplit(Request& r, MethodParams& params) {
split_with_options(r, params, SPLIT_RIGHT);
}
static void search_action(Table& table, Table::element_type row, int, int, int, int, void *) {
if(row)
table+=row;
}
#ifndef DOXYGEN
struct Replace_action_info {
Request* request;
const String* src; String* dest;
VTable* vtable;
Value* replacement_code;
};
#endif
/// @todo they can do $global[$result] there, getting pointer to later-invalid local var, kill this
static void replace_action(Table& table, ArrayString* row,
int prestart, int prefinish,
int poststart, int postfinish,
void *info) {
Replace_action_info& ai=*static_cast<Replace_action_info *>(info);
if(row) { // begin&middle
// piece from last match['prestart'] to beginning of this match['prefinish']
if(prestart!=prefinish)
*ai.dest << ai.src->mid(prestart, prefinish);//ai.dest->APPEND_CONST("-");
// store found parts in one-record VTable
if(table.count()) // middle
table.put(0, row);
else // begin
table+=row;
{ // execute 'replacement_code' in 'table' context
ai.vtable->set_table(table);
*ai.dest << ai.request->process_to_string(*ai.replacement_code);
}
} else // end
*ai.dest << ai.src->mid(poststart, postfinish);
}
/// @todo use pcre:study somehow
static void _match(Request& r, MethodParams& params) {
Value& regexp=params.as_no_junction(0, "regexp must not be code");
const String* options=
params.count()>1?
¶ms.as_no_junction(1, "options must not be code").as_string():0;
Temp_lang temp_lang(r, String::L_PASS_APPENDED);
const String& src=GET_SELF(r, VString).string();
bool just_matched;
if(params.count()<3) { // search
Table* table=src.match(r.charsets.source(),
regexp.as_string(), options,
search_action, 0,
just_matched);
Value* result;
if(table)
result=new VTable(table); // table of pre/match/post+substrings
else
result=new VBool(just_matched);
r.write_assign_lang(*result);
} else { // replace
Value& replacement_code=params.as_junction(2, "replacement param must be code");
String result;
VTable* vtable=new VTable;
Replace_action_info info={
&r,
&src,
&result,
vtable,
&replacement_code
};
Temp_value_element temp_match_var(
*replacement_code.get_junction()->method_frame,
match_var_name, vtable);
src.match(r.charsets.source(),
r.process_to_string(regexp), options,
replace_action, &info,
just_matched);
r.write_assign_lang(result);
}
}
static void change_case(Request& r, MethodParams&,
String::Change_case_kind kind) {
const String& src=GET_SELF(r, VString).string();
r.write_assign_lang(src.change_case(r.charsets.source(), kind));
}
static void _upper(Request& r, MethodParams& params) {
change_case(r, params, String::CC_UPPER);
}
static void _lower(Request& r, MethodParams& params) {
change_case(r, params, String::CC_LOWER);
}
#ifndef DOXYGEN
class String_sql_event_handlers: public SQL_Driver_query_event_handlers {
const String& statement_string; const char* statement_cstr;
bool got_column;
public:
bool got_cell;
String& result;
public:
String_sql_event_handlers(
const String& astatement_string, const char* astatement_cstr):
statement_string(astatement_string), statement_cstr(astatement_cstr),
got_column(false),
got_cell(false),
result(*new String) {}
bool add_column(SQL_Error& error, const char* /*str*/, size_t /*length*/) {
if(got_column) {
error=SQL_Error("parser.runtime",
//statement_string,
"result must contain exactly one column");
return true;
}
got_column=true;
return false;
}
bool before_rows(SQL_Error& /*error*/ ) { /* ignore */ return false; }
bool add_row(SQL_Error& /*error*/) { /* ignore */ return false; }
bool add_row_cell(SQL_Error& error, const char* str, size_t length) {
if(got_cell) {
error=SQL_Error("parser.runtime",
//statement_string,
"result must not contain more then one row");
return true;
}
try {
got_cell=true;
result.append_know_length(str, length, String::L_TAINTED);
return false;
} catch(...) {
error=SQL_Error("exception occured in String_sql_event_handlers::add_row_cell");
return true;
}
}
};
#endif
extern String sql_limit_name;
extern String sql_offset_name;
extern String sql_default_name;
extern String sql_distinct_name;
const String* sql_result_string(Request& r, MethodParams& params,
HashStringValue*& options, Value*& default_code) {
Value& statement=params.as_junction(0, "statement must be code");
ulong limit=0;
ulong offset=0;
default_code=0;
if(params.count()>1) {
Value& voptions=params.as_no_junction(1, "options must be hash, not code");
if(!voptions.is_string())
if((options=voptions.get_hash())) {
if(Value* vlimit=options->get(sql_limit_name))
limit=(ulong)r.process_to_value(*vlimit).as_double();
if(Value* voffset=options->get(sql_offset_name))
offset=(ulong)r.process_to_value(*voffset).as_double();
if((default_code=options->get(sql_default_name))) {
if(!default_code->get_junction())
throw Exception("parser.runtime",
0,
"default option must be code");
}
} else
throw Exception("parser.runtime",
0,
"options must be hash");
} else
options=0;
Temp_lang temp_lang(r, String::L_SQL);
const String& statement_string=r.process_to_string(statement);
const char* statement_cstr=
statement_string.cstr(String::L_UNSPECIFIED, r.connection());
String_sql_event_handlers handlers(statement_string, statement_cstr);
r.connection()->query(
statement_cstr, offset, limit,
handlers,
statement_string);
if(!handlers.got_cell)
return 0; // no lines, caller should return second param[default value]
return &handlers.result;
}
static void _sql(Request& r, MethodParams& params) {
HashStringValue* options;
Value* default_code;
const String* string=sql_result_string(r, params, options, default_code);
if(!string) {
if(default_code) {
string=&r.process_to_string(*default_code);
} else
throw Exception("parser.runtime",
0,
"produced no result, but no default option specified");
}
r.write_assign_lang(*string);
}
static void _replace(Request& r, MethodParams& params) {
const String& src=GET_SELF(r, VString).string();
Table* table=params.as_no_junction(0, "parameter must not be code").get_table();
if(!table)
throw Exception("parser.runtime",
0,
"parameter must be table");
Dictionary dict(*table);
r.write_assign_lang(src.replace(dict));
}
static void _save(Request& r, MethodParams& params) {
const String& file_name=params.as_string(params.count()-1,
"file name must be string");
const String& src=GET_SELF(r, VString).string();
bool do_append=false;
if(params.count()>1) {
const String& mode=params.as_string(0, "mode must be string");
if(mode=="append")
do_append=true;
else
throw Exception("parser.runtime",
&mode,
"unknown mode, must be 'append'");
}
// write
const char* buf=src.cstr(String::L_UNSPECIFIED, r.connection(false/*no error if none*/));
file_write(r.absolute(file_name),
buf, strlen(buf), true, do_append);
}
static void _normalize(Request& r, MethodParams&) {
const String& src=GET_SELF(r, VString).string();
r.write_assign_lang(src);
}
static void _trim(Request& r, MethodParams& params) {
const String& src=GET_SELF(r, VString).string();
String::Trim_kind kind=String::TRIM_BOTH;
const char* chars=0;
if(params.count()>0) {
const String& skind=params.as_string(0,
"'where' must be string");
if(skind==TRIM_START_OPTION)
kind=String::TRIM_START;
else if(skind==TRIM_END_OPTION)
kind=String::TRIM_END;
else if(skind==TRIM_BOTH_OPTION)
kind=String::TRIM_BOTH;
else
throw Exception("parser.runtime",
&skind,
"'kind' should be one of "TRIM_START_OPTION", "TRIM_BOTH_OPTION", "TRIM_END_OPTION);
if(params.count()>1) {
const String& schars=params.as_string(1, "'chars' must be string");
if(!schars.length())
throw Exception("parser.runtime",
0,
"'chars' must not be empty");
chars=schars.cstr();
}
}
r.write_assign_lang(src.trim(kind, chars));
}
// constructor
MString::MString(): Methoded("string") {
// ^string.length[]
add_native_method("length", Method::CT_DYNAMIC, _length, 0, 0);
// ^string.int[]
// ^string.int(default)
add_native_method("int", Method::CT_DYNAMIC, _int, 0, 1);
// ^string.double[]
// ^string.double(default)
add_native_method("double", Method::CT_DYNAMIC, _double, 0, 1);
// ^string.format{format}
add_native_method("format", Method::CT_DYNAMIC, _string_format, 1, 1);
// ^string.left(n)
add_native_method("left", Method::CT_DYNAMIC, _left, 1, 1);
// ^string.right(n)
add_native_method("right", Method::CT_DYNAMIC, _right, 1, 1);
// ^string.mid(p;n)
add_native_method("mid", Method::CT_DYNAMIC, _mid, 1, 2);
// ^string.pos[substr]
add_native_method("pos", Method::CT_DYNAMIC, _pos, 1, 1);
// ^string.split[delim]
// ^string.split[delim][options]
add_native_method("split", Method::CT_DYNAMIC, _split, 1, 2);
// old names for backward compatibility
// ^string.lsplit[delim]
add_native_method("lsplit", Method::CT_DYNAMIC, _lsplit, 1, 1);
// ^string.rsplit[delim]
add_native_method("rsplit", Method::CT_DYNAMIC, _rsplit, 1, 1);
// ^string.match[regexp][options]
// ^string.match[regexp][options]{replacement-code}
add_native_method("match", Method::CT_DYNAMIC, _match, 1, 3);
// ^string.toupper[]
add_native_method("upper", Method::CT_DYNAMIC, _upper, 0, 0);
// ^string.tolower[]
add_native_method("lower", Method::CT_DYNAMIC, _lower, 0, 0);
// ^sql[query]
// ^sql[query][$.limit(1) $.offset(2) $.default[n/a]]
add_native_method("sql", Method::CT_STATIC, _sql, 1, 2);
// ^string.replace[table]
add_native_method("replace", Method::CT_DYNAMIC, _replace, 1, 1);
// ^string.save[file]
add_native_method("save", Method::CT_DYNAMIC, _save, 1, 2);
// ^string.normalize[]
add_native_method("normalize", Method::CT_DYNAMIC, _normalize, 0, 0);
// ^string.trim[[start|both|end][;chars]]
add_native_method("trim", Method::CT_DYNAMIC, _trim, 0, 2);
}
E-mail: