--- parser3/src/classes/file.C 2002/09/10 10:55:32 1.97 +++ parser3/src/classes/file.C 2003/04/04 14:42:38 1.110 @@ -1,11 +1,13 @@ /** @file Parser: @b file parser class. - Copyright (c) 2001, 2002 ArtLebedev Group (http://www.artlebedev.com) + Copyright (c) 2001, 2003 ArtLebedev Group (http://www.artlebedev.com) Author: Alexandr Petrosian (http://paf.design.ru) + + portions by Victor Fedoseev" [January 23, 2003] */ -static const char* IDENT_FILE_C="$Date: 2002/09/10 10:55:32 $"; +static const char* IDENT_FILE_C="$Date: 2003/04/04 14:42:38 $"; #include "pa_config_includes.h" @@ -21,11 +23,13 @@ static const char* IDENT_FILE_C="$Date: #include "pa_dir.h" #include "pa_vtable.h" #include "pa_charset.h" +#include "pa_charsets.h" // defines #define TEXT_MODE_NAME "text" #define STDIN_EXEC_PARAM_NAME "stdin" +#define CHARSET_EXEC_PARAM_NAME "charset" // consts @@ -95,7 +99,7 @@ static void _save(Request& r, const Stri Value& vfile_name=params->as_no_junction(1, "file name must not be code"); // save - static_cast(r.self)->save(r.absolute(vfile_name.as_string()), + static_cast(r.get_self())->save(r.absolute(vfile_name.as_string()), vmode_name.as_string()==TEXT_MODE_NAME); } @@ -116,21 +120,42 @@ static void _move(Request& r, const Stri r.absolute(vto_file_name.as_string())); } +static void _load_pass_param(const Hash::Key& key, Hash::Val *value, void *info) { + Hash& dest=*static_cast(info); + dest.put(key, value); +} static void _load(Request& r, const String& method_name, MethodParams *params) { Pool& pool=r.pool(); Value& vmode_name=params-> as_no_junction(0, "mode must not be code"); const String& lfile_name=r.absolute(params->as_no_junction(1, "file name must not be code").as_string()); + Value *third_param=params->size()>2?&params->as_no_junction(2, "filename or options must not be code"):0; + Hash *third_param_hash=third_param?third_param->get_hash(&method_name):0; + int alt_filename_param_index=2; + if(third_param_hash) + alt_filename_param_index++; void *data; size_t 
size; + Hash *fields=0; file_read(pool, lfile_name, data, size, - vmode_name.as_string()==TEXT_MODE_NAME); + vmode_name.as_string()==TEXT_MODE_NAME, + third_param_hash, + &fields + ); - char *user_file_name=params->size()>2? - params->as_string(2, "filename must be string").cstr(String::UL_FILE_SPEC) + char *user_file_name=params->size()>alt_filename_param_index? + params->as_string(alt_filename_param_index, "filename must be string").cstr(String::UL_FILE_SPEC) :lfile_name.cstr(String::UL_FILE_SPEC); + + Value *vcontent_type=0; + if(fields) + vcontent_type=static_cast(fields->get(*content_type_name)); + if(!vcontent_type) + vcontent_type=new(pool) VString(r.mime_type_of(user_file_name)); - static_cast(r.self)->set(true/*tainted*/, data, size, - user_file_name, new(pool) VString(r.mime_type_of(user_file_name))); + VFile& self=*static_cast(r.get_self()); + self.set(true/*tainted*/, data, size, user_file_name, vcontent_type); + if(fields) + fields->for_each(_load_pass_param, &self.fields()); } static void _stat(Request& r, const String& method_name, MethodParams *params) { @@ -145,7 +170,7 @@ static void _stat(Request& r, const Stri size, atime, mtime, ctime); - VFile& vfile=*static_cast(r.self); + VFile& vfile=*static_cast(r.get_self()); vfile.set(true/*tainted*/, 0/*no bytes*/, size); Hash& ff=vfile.fields(); ff.put(*new(pool) String(pool, "adate"), new(pool) VDate(pool, atime)); @@ -168,21 +193,24 @@ static bool is_safe_env_key(const char * #ifndef DOXYGEN struct Append_env_pair_info { Hash* hash; - const String* sstdin; + Value* vstdin; + Value* vcharset; }; #endif -static void append_env_pair(const Hash::Key& key, Hash::Val *value, void *info) { +static void append_env_pair(const Hash::Key& key, Hash::Val *avalue, void *info) { Append_env_pair_info& pi=*static_cast(info); - const String& svalue=static_cast(value)->as_string(); + Value& value=*static_cast(avalue); if(key==STDIN_EXEC_PARAM_NAME) { - pi.sstdin=&svalue; + pi.vstdin=&value; + } else 
if(key==CHARSET_EXEC_PARAM_NAME) { + pi.vcharset=&value; } else { if(!is_safe_env_key(key.cstr())) throw Exception("parser.runtime", &key, "not safe environment variable"); - pi.hash->put(key, &svalue); + pi.hash->put(key, &value.as_string()); } } #ifndef DOXYGEN @@ -249,14 +277,29 @@ static void _exec_cgi(Request& r, const //env.put(*new(pool) String(pool, "SCRIPT_FILENAME"), ??&script_name); // environment & stdin from param - String in(pool); + String raw_in(pool); + Charset *charset=0; // default script works raw_in 'source' charset = no transcoding needed if(params->size()>1) { Value& venv=params->as_no_junction(1, "env must not be code"); if(Hash *user_env=venv.get_hash(&method_name)) { Append_env_pair_info info={&env}; user_env->for_each(append_env_pair, &info); - if(info.sstdin) - in.append(*info.sstdin, String::UL_CLEAN, true); + // $.stdin + if(info.vstdin) { + if(const String *sstdin=info.vstdin->get_string()) { + raw_in.append(*sstdin, String::UL_CLEAN, true); + } else + if(VFile *vfile=static_cast(info.vstdin->as("file", false))) + raw_in.APPEND_TAINTED((const char *)vfile->value_ptr(), vfile->value_size(), + "$.stdin[assigned]", 0); + else + throw Exception("parser.runtime", + &method_name, + STDIN_EXEC_PARAM_NAME " parameter must be string or file"); + } + // $.charset + if(info.vcharset) + charset=&charsets->get_charset(info.vcharset->as_string()); } } @@ -268,48 +311,63 @@ static void _exec_cgi(Request& r, const *argv+=&params->as_string(i, "parameter must be string"); } - // passing POST data - if(in.is_empty()) // if $.stdin[...] not specified - in.APPEND(r.post_data, r.post_size, String::UL_CLEAN, "POST data (passed)", 0); + // transcode if necessary + String* real_in=&raw_in; + if(charset) { + Charset::transcode(pool, pool.get_source_charset(), *charset, env); + if(argv) + Charset::transcode(pool, pool.get_source_charset(), *charset, *argv); + real_in=&Charset::transcode(pool, pool.get_source_charset(), *charset, raw_in); + } // exec! 
- String out(pool); - String& err=*new(pool) String(pool); - int status=pa_exec(false/*forced_allow*/, script_name, &env, argv, in, out, err); - - VFile& self=*static_cast(r.self); - - const String *body=&out; // ^file:exec - Value *content_type=0; - const char *eol_marker="\r\n"; size_t eol_marker_size=2; + String raw_out(pool); + String& raw_err=*new(pool) String(pool); + int status=0; + + const String *body=0; const String *header=0; + const char *eol_marker=0; size_t eol_marker_size; int header_break_pos; + + String *real_out=&raw_out; + String *real_err=&raw_err; if(cgi) { // ^file:cgi - // construct with 'out' body and header - int delim_size; - int pos=out.pos("\r\n\r\n", delim_size=4); - if(pos<0) { - eol_marker="\n"; eol_marker_size=1; - pos=out.pos("\n\n", delim_size=2); + status = pa_exec(false/*forced_allow*/, script_name, &env, argv, *real_in, raw_out, raw_err, &header_break_pos, &eol_marker, &eol_marker_size); + // transcode if necessary + if(charset) { + real_out=&Charset::transcode(pool, *charset, pool.get_source_charset(), raw_out); + real_err=&Charset::transcode(pool, *charset, pool.get_source_charset(), raw_err); } - if(pos<0) { - delim_size=0; // calm down, compiler + if(header_break_pos == -1) throw Exception(0, &method_name, "output does not contain CGI header; " "exit status=%d; stdoutsize=%u; stdout: \"%s\"; stderrsize=%u; stderr: \"%s\"", status, - (uint)out.size(), out.cstr(), - (uint)err.size(), err.cstr()); - } + (uint)real_out->size(), real_out->cstr(), + (uint)real_err->size(), real_err->cstr()); - header=&out.mid(0, pos); - body=&out.mid(pos+delim_size, out.size()); + header=&real_out->mid(0, header_break_pos); + body=&real_out->mid(header_break_pos+eol_marker_size*2, real_out->size()); + }else{ // ^file:exec + status = pa_exec(false/*forced_allow*/, script_name, &env, argv, *real_in, raw_out, raw_err); + // transcode if necessary + if(charset) { + real_out=&Charset::transcode(pool, *charset, pool.get_source_charset(), raw_out); + 
real_err=&Charset::transcode(pool, *charset, pool.get_source_charset(), raw_err); + } + body=real_out; } + + + + VFile& self=*static_cast(r.get_self()); + // body self.set(false/*not tainted*/, body->cstr(), body->size()); // $fields << header - if(header) { + if(header && eol_marker) { Array rows(pool); header->split(rows, 0, eol_marker, eol_marker_size); Pass_cgi_header_attribute_info info={&self.fields()}; @@ -320,14 +378,14 @@ static void _exec_cgi(Request& r, const // $status self.fields().put( - *new(pool) String(pool, "status"), + *file_status_name, new(pool) VInt(pool, status)); // $stderr - if(err.size()) { + if(real_err->size()) { self.fields().put( *new(pool) String(pool, "stderr"), - new(pool) VString(err)); + new(pool) VString(*real_err)); } } static void _exec(Request& r, const String& method_name, MethodParams *params) { @@ -394,7 +452,7 @@ static void _list(Request& r, const Stri char *file_name_cstr=(char *)pool.malloc(file_name_size); memcpy(file_name_cstr, ffblk.ff_name, file_name_size); String &file_name=*new(pool) String(pool); - file_name.APPEND(file_name_cstr, file_name_size, String::UL_FILE_SPEC, + file_name.APPEND_TAINTED(file_name_cstr, file_name_size, method_name.origin().file, method_name.origin().line); Array& row=*new(pool) Array(pool); @@ -518,6 +576,26 @@ static void _justext(Request& r, const S r.write_assign_lang(file_spec.mid(afterdot, file_spec.size())); } +static void _fullpath(Request& r, const String& method_name, MethodParams *params) { + const String& file_spec=params->as_string(0, "file name must be string"); + const String *result; + if(file_spec.first_char()=='/') + result=&file_spec; + else { + // /some/page.html: ^file:fullpath[a.gif] => /some/a.gif + const String& full_disk_path=r.absolute(file_spec); + size_t document_root_length=strlen(r.info.document_root); + + if(document_root_length>0) { + char last_char=r.info.document_root[document_root_length-1]; + if(last_char == '/' || last_char == '\\') + 
--document_root_length; + } + result=&full_disk_path.mid(document_root_length, full_disk_path.size()); + } + r.write_assign_lang(*result); +} + // constructor @@ -568,6 +646,8 @@ MFile::MFile(Pool& apool) : Methoded(apo add_native_method("justname", Method::CT_STATIC, _justname, 1, 1); // ^file:justext[/a/some.tar.gz]=gz add_native_method("justext", Method::CT_STATIC, _justext, 1, 1); + // /some/page.html: ^file:fullpath[a.gif] => /some/a.gif + add_native_method("fullpath", Method::CT_STATIC, _fullpath, 1, 1); } // global variable