--- parser3/src/classes/xdoc.C 2001/09/26 15:43:59 1.2 +++ parser3/src/classes/xdoc.C 2016/04/06 16:08:19 1.185 @@ -1,409 +1,774 @@ /** @file Parser: @b xdoc parser class. - Copyright (c) 2001 ArtLebedev Group (http://www.artlebedev.com) - Author: Alexander Petrosyan (http://design.ru/paf) - - $Id: xdoc.C,v 1.2 2001/09/26 15:43:59 parser Exp $ + Copyright (c) 2001-2015 Art. Lebedev Studio (http://www.artlebedev.com) + Author: Alexandr Petrosian (http://paf.design.ru) */ -#include "classes.h" + +#include "pa_config_includes.h" + #ifdef XML +#include "libxml/tree.h" +#include "libxml/HTMLtree.h" +#include "libxslt/xsltInternals.h" +#include "libxslt/transform.h" +#include "libxslt/xsltutils.h" +#include "libxslt/variables.h" +#include "libxslt/imports.h" + +#include "pa_vmethod_frame.h" + +#include "pa_stylesheet_manager.h" #include "pa_request.h" #include "pa_vxdoc.h" -#include "pa_xslt_stylesheet_manager.h" -#include "pa_stylesheet_connection.h" +#include "pa_charset.h" #include "pa_vfile.h" +#include "pa_xml_exception.h" #include "xnode.h" +#include "pa_charsets.h" -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include -#include +volatile const char * IDENT_XDOC_C="$Id: xdoc.C,v 1.185 2016/04/06 16:08:19 moko Exp $"; // defines #define XDOC_CLASS_NAME "xdoc" -#define XDOC_OUTPUT_METHOD_OPTION_NAME "method" -#define XDOC_OUTPUT_METHOD_OPTION_VALUE_XML "xml" -#define XDOC_OUTPUT_METHOD_OPTION_VALUE_HTML "html" -#define XDOC_OUTPUT_METHOD_OPTION_VALUE_TEXT "text" - -#define XDOC_OUTPUT_ENCODING_OPTION_NAME "encoding" - -#define XDOC_OUTPUT_DEFAULT_INDENT 4 - // class -class MXdoc : public MXnode { +class MXdoc: public MXnode { public: // VStateless_class - Value *create_new_value(Pool& pool) { return new(pool) VXdoc(pool); } + Value* create_new_value(Pool&) { return new VXdoc(); } public: - MXdoc(Pool& pool); + MXdoc(); -public: // Methoded - bool used_directly() { return true; } }; -// methods +// global variable -class ParserStringXalanOutputStream: public XalanOutputStream { -public: - - explicit ParserStringXalanOutputStream(String& astring) : fstring(astring) {} +DECLARE_CLASS_VAR(xdoc, new MXdoc); -protected: // XalanOutputStream +// helper classes - virtual void writeData(const char *theBuffer, unsigned long theBufferLength) { - char *copy=(char *)fstring.malloc((size_t)theBufferLength); - memcpy(copy, theBuffer, (size_t)theBufferLength); - fstring.APPEND_CLEAN(copy, (size_t)theBufferLength, "xdoc", 0); - } +class xmlOutputBuffer_auto_ptr { +public: + explicit xmlOutputBuffer_auto_ptr(xmlOutputBuffer *_APtr = 0) + : _Owns(_APtr != 0), _Ptr(_APtr) {} + xmlOutputBuffer_auto_ptr(const xmlOutputBuffer_auto_ptr& _Y) + : _Owns(_Y._Owns), _Ptr(_Y.release()) {} + xmlOutputBuffer_auto_ptr& operator=(const xmlOutputBuffer_auto_ptr& _Y) + {if (this != &_Y) + {if (_Ptr != _Y.get()) + {if (_Owns && _Ptr) + xmlOutputBufferClose(_Ptr); + _Owns = _Y._Owns; } + else if (_Y._Owns) + _Owns = true; + _Ptr = _Y.release(); } + return (*this); } + ~xmlOutputBuffer_auto_ptr() + {if (_Owns && _Ptr) + xmlOutputBufferClose(_Ptr); } + xmlOutputBuffer& operator*() const + {return (*get()); } + xmlOutputBuffer *operator->() const + {return (get()); } + xmlOutputBuffer *get() const + {return (_Ptr); } + xmlOutputBuffer *release() const + {((xmlOutputBuffer_auto_ptr *)this)->_Owns = false; + return (_Ptr); } +private: + bool _Owns; + xmlOutputBuffer *_Ptr; +}; - virtual void doFlush() {} +class xsltTransformContext_auto_ptr { +public: + explicit xsltTransformContext_auto_ptr(xsltTransformContext *_APtr = 0) + : _Owns(_APtr != 0), _Ptr(_APtr) {} + xsltTransformContext_auto_ptr(const xsltTransformContext_auto_ptr& _Y) + : _Owns(_Y._Owns), _Ptr(_Y.release()) {} + xsltTransformContext_auto_ptr& operator=(const xsltTransformContext_auto_ptr& _Y) + {if (this != &_Y) + {if (_Ptr != _Y.get()) + {if (_Owns && _Ptr) + xsltFreeTransformContext(_Ptr); + _Owns = _Y._Owns; } + else if (_Y._Owns) + _Owns = true; + _Ptr = _Y.release(); } + return (*this); } + ~xsltTransformContext_auto_ptr() + {if (_Owns && _Ptr) + xsltFreeTransformContext(_Ptr); } + xsltTransformContext& operator*() const + {return (*get()); } + xsltTransformContext *operator->() const + {return (get()); } + xsltTransformContext *get() const + {return (_Ptr); } + xsltTransformContext *release() const + {((xsltTransformContext_auto_ptr *)this)->_Owns = false; + return (_Ptr); } +private: + bool _Owns; + xsltTransformContext *_Ptr; +}; +class xsltStylesheet_auto_ptr { +public: + explicit xsltStylesheet_auto_ptr(xsltStylesheet *_APtr = 0) + : _Owns(_APtr != 0), _Ptr(_APtr) {} + xsltStylesheet_auto_ptr(const xsltStylesheet_auto_ptr& _Y) + : _Owns(_Y._Owns), _Ptr(_Y.release()) {} + xsltStylesheet_auto_ptr& operator=(const xsltStylesheet_auto_ptr& _Y) + {if (this != &_Y) + {if (_Ptr != _Y.get()) + {if (_Owns && _Ptr) + xsltFreeStylesheet(_Ptr); + _Owns = _Y._Owns; } + else if (_Y._Owns) + _Owns = true; + _Ptr = _Y.release(); } + return (*this); } + ~xsltStylesheet_auto_ptr() + {if (_Owns && _Ptr) + xsltFreeStylesheet(_Ptr); } + xsltStylesheet& operator*() const + {return (*get()); } + xsltStylesheet *operator->() const + {return (get()); } + xsltStylesheet *get() const + {return (_Ptr); } + xsltStylesheet *release() const + {((xsltStylesheet_auto_ptr *)this)->_Owns = false; + return (_Ptr); } private: + bool _Owns; + xsltStylesheet *_Ptr; +}; - String& fstring; - +// methods + +static void writeNode(Request& r, VXdoc& xdoc, xmlNode* node) { + if(!node) + throw Exception(PARSER_RUNTIME, + 0, + "error creating node"); // OOM, bad name, things like that + + // write out result + r.write_no_lang(xdoc.wrap(*node)); +} + +struct IdsIteratorInfo { + xmlChar *elementId; + xmlNode *element; }; -static void create_optioned_listener( - const char *& content_type, const char *& charset, FormatterListener *& listener, - Pool& pool, - const String& method_name, MethodParams *params, int index, Writer& writer) { - // default encoding from pool - const String *scharset=&pool.get_charset(); - const String *method=0; - XalanDOMString xalan_encoding; - - if(params->size()>index) { - Value& voptions=params->as_no_junction(index, "options must not be code"); - if(voptions.is_defined()) { - if(Hash *options=voptions.get_hash()) { - // $.method[xml|html|text] - if(Value *vmethod=static_cast(options->get(*new(pool) - String(pool, XDOC_OUTPUT_METHOD_OPTION_NAME)))) - method=&vmethod->as_string(); - - // $.encoding[windows-1251|...] - if(Value *vencoding=static_cast(options->get(*new(pool) - String(pool, XDOC_OUTPUT_ENCODING_OPTION_NAME)))) { - scharset=&vencoding->as_string(); - } - } else - PTHROW(0, 0, - &method_name, - "options must be hash"); - } +/* Hash Scanner function for pa_getElementById */ +extern "C" void // switching to calling convetion of libxml +idsHashScanner (void *payload, void *data, xmlChar *name) { + IdsIteratorInfo *priv = (IdsIteratorInfo *)data; + + if (priv->element == NULL && xmlStrEqual (name, priv->elementId)) + { + xmlNode* parent=((xmlID *)payload)->attr->parent; + assert(parent); + priv->element=parent; } +} + +static xmlNode* +pa_getElementById(xmlDoc& xmldoc, xmlChar* elementId) { + xmlHashTable *ids = (xmlHashTable *)xmldoc.ids; + IdsIteratorInfo iter={elementId, NULL}; + xmlHashScan(ids, idsHashScanner, &iter); + return iter.element; +} + +/* +static xmlNode * +pa_importNode (xmlDoc& xmldoc, xmlNode& importedNode, bool deep) { + xmlNode *result = NULL; + + switch (importedNode.type) { + case XML_ATTRIBUTE_NODE: + result = (xmlNode *)xmlCopyProp(xmldoc, (xmlAttr *)importedNode); + result.parent=0; // no idea + break; + case XML_DOCUMENT_FRAG_NODE: + case XML_ELEMENT_NODE: + case XML_ENTITY_REF_NODE: + case XML_PI_NODE: + case XML_TEXT_NODE: + case XML_CDATA_SECTION_NODE: + case XML_COMMENT_NODE: + result = xmlCopyNode (importedNode->n, deep); + xmlSetTreeDoc (result, priv->n); + break; + default: + *exc = GDOME_NOT_SUPPORTED_ERR; + } + + return result; +} +*/ - xalan_encoding.append(charset=scharset->cstr()); - if(!method/*default='xml'*/ || *method == XDOC_OUTPUT_METHOD_OPTION_VALUE_XML) { - content_type="text/xml"; - listener=new FormatterToXML(writer, - XalanDOMString(), // version - true, // doIndent - XDOC_OUTPUT_DEFAULT_INDENT, // indent - xalan_encoding // encoding - ); - } else if(*method == XDOC_OUTPUT_METHOD_OPTION_VALUE_HTML) { - content_type="text/html"; - listener=new FormatterToHTML(writer, - xalan_encoding, // encoding - XalanDOMString(), // mediaType - XalanDOMString(), // doctypeSystem; String to be printed at the top of the document - XalanDOMString(), // doctypePublic - true, // doIndent - XDOC_OUTPUT_DEFAULT_INDENT // indent - ); - } else if(*method == XDOC_OUTPUT_METHOD_OPTION_VALUE_TEXT) { - content_type="text/plain"; - listener=new FormatterToText(writer, - xalan_encoding // encoding - ); +// Element createElement(in DOMString tagName) raises(DOMException); +static void _createElement(Request& r, MethodParams& params) { + xmlChar* tagName=as_xmlname(r, params, 0, "tagName must be string"); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=xmlNewDocNode(&xmldoc, NULL, tagName, NULL); + writeNode(r, vdoc, node); +} + +// Element createElementNS(in DOMString namespaceURI, in DOMString qualifiedName) raises(DOMException); +static void _createElementNS(Request& r, MethodParams& params) { + xmlChar* namespaceURI=as_xmlnsuri(r, params, 0); + xmlChar* qualifiedName=as_xmlqname(r, params, 1); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlChar* prefix=0; + xmlChar* localName=xmlSplitQName2(qualifiedName, &prefix); + + xmlNode *node; + if(localName) { + xmlNs& ns=pa_xmlMapNs(xmldoc, namespaceURI, prefix); + node=xmlNewDocNode(&xmldoc, &ns, localName, NULL); } else - PTHROW(0, 0, - method, - XDOC_OUTPUT_METHOD_OPTION_NAME " option is invalid; valid methods are: " - "'" XDOC_OUTPUT_METHOD_OPTION_VALUE_XML "', " - "'" XDOC_OUTPUT_METHOD_OPTION_VALUE_HTML "', " - "'" XDOC_OUTPUT_METHOD_OPTION_VALUE_TEXT "'"); - - // never reached + node=xmlNewDocNode(&xmldoc, NULL, qualifiedName/*unqualified, actually*/, NULL); + writeNode(r, vdoc, node); } -static void _save(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXnode& vnode=*static_cast(r.self); +// DocumentFragment createDocumentFragment() +static void _createDocumentFragment(Request& r, MethodParams&) { + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); - // filespec - const String& file_name=params->as_string(0, "file name must not be code"); - const char *filespec=r.absolute(file_name).cstr(String::UL_FILE_SPEC); - - // node - XalanNode& node=vnode.get_node(pool, &method_name); + xmlNode *node=xmlNewDocFragment(&xmldoc); + writeNode(r, vdoc, node); +} - try { - XalanFileOutputStream stream(XalanDOMString(filespec, strlen(filespec))); - XalanOutputStreamPrintWriter writer(stream); - const char *content_type, *charset; - FormatterListener *formatterListener; - create_optioned_listener(content_type, charset, formatterListener, - pool, method_name, params, 1, writer); - FormatterTreeWalker treeWalker(*formatterListener); - treeWalker.traverse(&node); // Walk that node and produce the XML... - } catch(const XSLException& e) { - r._throw(&method_name, e); - } +// Text createTextNode(in DOMString data); +static void _createTextNode(Request& r, MethodParams& params) { + xmlChar* data=as_xmlchar(r, params, 0, XML_DATA_MUST_BE_STRING); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=xmlNewDocText(&xmldoc, data); + writeNode(r, vdoc, node); } -static void _string(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXnode& vnode=*static_cast(r.self); - - // node - XalanNode& node=vnode.get_node(pool, &method_name); - - try { - String parserString=*new(pool) String(pool); - ParserStringXalanOutputStream stream(parserString); - XalanOutputStreamPrintWriter writer(stream); - const char *content_type, *charset; - FormatterListener *formatterListener; - create_optioned_listener(content_type, charset, formatterListener, - pool, method_name, params, 0, writer); - FormatterTreeWalker treeWalker(*formatterListener); - treeWalker.traverse(&node); // Walk that node and produce the XML... - - // write out result - r.write_no_lang(parserString); - } catch(const XSLException& e) { - r._throw(&method_name, e); - } +// Comment createComment(in DOMString data) +static void _createComment(Request& r, MethodParams& params) { + xmlChar* data=as_xmlchar(r, params, 0, XML_DATA_MUST_BE_STRING); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + + xmlNode *node=xmlNewComment(data); + writeNode(r, vdoc, node); } +// CDATASection createCDATASection(in DOMString data) raises(DOMException); +static void _createCDATASection(Request& r, MethodParams& params) { + xmlChar* data=as_xmlchar(r, params, 0, XML_DATA_MUST_BE_STRING); -static void _file(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXnode& vnode=*static_cast(r.self); - - // node - XalanNode& node=vnode.get_node(pool, &method_name); - - try { - String& parserString=*new(pool) String(pool); - ParserStringXalanOutputStream stream(parserString); - XalanOutputStreamPrintWriter writer(stream); - const char *content_type, *charset; - FormatterListener *formatterListener; - create_optioned_listener(content_type, charset, formatterListener, - pool, method_name, params, 0, writer); - FormatterTreeWalker treeWalker(*formatterListener); - treeWalker.traverse(&node); // Walk that node and produce the XML... - - // write out result - VFile& vfile=*new(pool) VFile(pool); - const char *cstr=parserString.cstr(); - String *scontent_type=new(pool) String(pool, content_type); - Value *vcontent_type; - if(charset) { - VHash *vhcontent_type=new(pool) VHash(pool); - vhcontent_type->hash().put(*value_name, new(pool) VString(*scontent_type)); - String *scharset=new(pool) String(pool, charset); - vhcontent_type->hash().put(*new(pool) String(pool, "charset"), new(pool) VString(*scharset)); - vcontent_type=vhcontent_type; - } else - vcontent_type=new(pool) VString(*scontent_type); - vfile.set(false/*tainted*/, cstr, strlen(cstr), 0/*file_name*/, vcontent_type); - r.write_no_lang(vfile); - } catch(const XSLException& e) { - r._throw(&method_name, e); - } + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=xmlNewCDataBlock(&xmldoc, data, strlen((const char*)data)); + writeNode(r, vdoc, node); } -static void _set(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXdoc& vdom=*static_cast(r.self); - - Value& vxml=params->as_junction(0, "xml must be code"); - Temp_lang temp_lang(r, String::UL_XML); - const String& xml=r.process(vxml).as_string(); - - std::istrstream stream(xml.cstr()); - const XalanParsedSource* parsedSource; - int error=vdom.transformer().parseSource(&stream, parsedSource); - - if(error) - PTHROW(0, 0, - &method_name, - vdom.transformer().getLastError()); +// ProcessingInstruction createProcessingInstruction(in DOMString target,in DOMString data) raises(DOMException); +static void _createProcessingInstruction(Request& r, MethodParams& params) { + xmlChar* target=as_xmlchar(r, params, 0, XML_DATA_MUST_BE_STRING); + xmlChar* data=as_xmlchar(r, params, 1, XML_DATA_MUST_BE_STRING); - // replace any previous parsed source - vdom.set_parsed_source(*parsedSource); + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=xmlNewDocPI(&xmldoc, target, data); + writeNode(r, vdoc, node); } -static void _load(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXdoc& vdom=*static_cast(r.self); +// Attr createAttribute(in DOMString name) raises(DOMException); +static void _createAttribute(Request& r, MethodParams& params) { + xmlChar* name=as_xmlname(r, params, 0); - // filespec - const String& file_name=params->as_string(0, "file name must not be code"); - const char *filespec=r.absolute(file_name).cstr(String::UL_FILE_SPEC); + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=(xmlNode*)xmlNewDocProp(&xmldoc, name, 0); + writeNode(r, vdoc, node); +} + +// Attr createAttributeNS(in DOMString namespaceURI, in DOMString qualifiedName) raises(DOMException); +static void _createAttributeNS(Request& r, MethodParams& params) { + xmlChar* namespaceURI=as_xmlnsuri(r, params, 0); + xmlChar* qualifiedName=as_xmlqname(r, params, 1); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlChar* prefix=0; + xmlChar* localName=xmlSplitQName2(qualifiedName, &prefix); + + xmlNode *node; + if(localName) { + xmlNs& ns=pa_xmlMapNs(xmldoc, namespaceURI, prefix); + node=(xmlNode*)xmlNewDocProp(&xmldoc, localName, NULL); + xmlSetNs(node, &ns); + } else + node=(xmlNode*)xmlNewDocProp(&xmldoc, qualifiedName/*unqualified, actually*/, NULL); + writeNode(r, vdoc, node); +} + +// EntityReference createEntityReference(in DOMString name) raises(DOMException); +static void _createEntityReference(Request& r, MethodParams& params) { + xmlChar* name=as_xmlname(r, params, 0); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=xmlNewReference(&xmldoc, name); + writeNode(r, vdoc, node); +} + + +static void _getElementById(Request& r, MethodParams& params) { + xmlChar* elementId=as_xmlname(r, params, 0, "elementID must be string"); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + if(xmlNode *node=pa_getElementById(xmldoc, elementId)) + writeNode(r, vdoc, node); +} + +static void _importNode(Request& r, MethodParams& params) { + xmlNode& importedNode=as_node(params, 0, "importedNode must be node"); + bool deep=params.as_bool(1, "deep must be bool", r); + + VXdoc& vdoc=GET_SELF(r, VXdoc); + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xmlNode *node=xmlDocCopyNode(&importedNode, &xmldoc, deep?1: 0); + writeNode(r, vdoc, node); +} + +/* +GdomeElement *gdome_doc_createElementNS (GdomeDocument *self, GdomeDOMString *namespaceURI, GdomeDOMString *qualifiedName, GdomeException *exc); +GdomeAttr *gdome_doc_createAttributeNS (GdomeDocument *self, GdomeDOMString *namespaceURI, GdomeDOMString *qualifiedName, GdomeException *exc); +*/ + +static void _create(Request& r, MethodParams& params) { + Charset& source_charset=r.charsets.source(); + VXdoc& vdoc=GET_SELF(r, VXdoc); + + Value& param=params[params.count()-1]; + xmlDoc* xmldoc; + bool set_encoding=false; + if(param.get_junction()) { // {...} + Temp_lang temp_lang(r, String::L_XML); + const String& xml=r.process_to_string(param); + + String::Body sbody=xml.cstr_to_string_body_untaint(r.flang, r.connection(false), &r.charsets); + xmldoc=xmlParseMemory(sbody.cstr(), sbody.length()); + + //printf("document=0x%p\n", document); + if(!xmldoc || xmlHaveGenericErrors()) + throw XmlException(0, r); + + // must be last action in if, see after if} + } else { // [localName] + if(const String* value = param.get_string()){ + xmlChar* localName=r.transcode(*value); + if(xmlValidateNCName(localName, 0) != 0) + throw XmlException(0, XML_INVALID_LOCAL_NAME, localName); + +#if 0 + GdomeDocumentType *documentType=gdome_di_createDocumentType ( + docimpl, + r.transcode(qualifiedName), + 0/*publicId*/, + 0/*systemId*/, + &exc); + if(!documentType || exc || xmlHaveGenericErrors()) + throw Exception( + method_name, + exc); + /// +xalan createXMLDecl ? +#endif + xmldoc=xmlNewDoc(0); + if(!xmldoc || xmlHaveGenericErrors()) + throw XmlException(0, r); + + xmlNode* node=xmlNewChild((xmlNode*)xmldoc, NULL, localName, NULL); + if(!node || xmlHaveGenericErrors()) + throw XmlException(0, r); + + set_encoding=true; + // must be last action in if, see after if} + } else { + VFile* vfile=param.as_vfile(String::L_AS_IS); + xmldoc=xmlParseMemory(vfile->value_ptr(), vfile->value_size()); + if(!xmldoc || xmlHaveGenericErrors()) + throw XmlException(0, r); + } + } + // must be first action after if} + // replace any previous parsed source + vdoc.set_xmldoc(r.charsets, *xmldoc); - const XalanParsedSource* parsedSource; - int error=vdom.transformer().parseSource(filespec, parsedSource); + // URI + const char* URI_cstr; + if(params.count()>1) { // absolute(param) + const String& URI=params.as_string(0, "URI must be string"); + URI_cstr=r.absolute(URI).cstr(); + } else // default = disk path to requested document + URI_cstr=r.request_info.path_translated; + if(URI_cstr) + xmldoc->URL=source_charset.transcode_buf2xchar(URI_cstr, strlen(URI_cstr)); + + if(set_encoding) { + const char* source_charset_name=source_charset.NAME().cstr(); + xmldoc->encoding=source_charset.transcode_buf2xchar(source_charset_name, strlen(source_charset_name)); + } +} - if(error) - PTHROW(0, 0, - &file_name, - vdom.transformer().getLastError()); +static void _load(Request& r, MethodParams& params) { + VXdoc& vdoc=GET_SELF(r, VXdoc); + // filespec + const String* uri=¶ms.as_string(0, "URI must be string"); + const char* uri_cstr; + if(uri->pos("://")==STRING_NOT_FOUND) // disk path + uri_cstr=r.absolute(*uri).taint_cstr(String::L_FILE_SPEC); + else // xxx:// + uri_cstr=uri->taint_cstr(String::L_AS_IS); // leave as-is for xmlParseFile to handle + + /// @todo!! add SAFE MODE!! + xmlDoc* xmldoc=xmlParseFile(uri_cstr); + if(!xmldoc || xmlHaveGenericErrors()) + throw XmlException(uri, r); + + // must be first action after if} // replace any previous parsed source - vdom.set_parsed_source(*parsedSource); + vdoc.set_xmldoc(r.charsets, *xmldoc); } -static void add_xslt_param(const Hash::Key& aattribute, Hash::Val *ameaning, - void *info) { - XalanTransformer& transformer=*static_cast(info); - const char *attribute_cstr=aattribute.cstr(); - const char *meaning_cstr=static_cast(ameaning)->as_string().cstr(); - - transformer.setStylesheetParam( - XalanDOMString(attribute_cstr), - XalanDOMString(meaning_cstr)); -} -static void _xslt(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXdoc& vdom=*static_cast(r.self); +String::C xdoc2buf(Request& r, VXdoc& vdoc, + XDocOutputOptions& oo, + const String* file_spec, + bool use_source_charset_to_render_and_client_charset_to_write_to_header=false) { + Charset* render=0; + Charset* header=0; + if(use_source_charset_to_render_and_client_charset_to_write_to_header) { + render=&r.charsets.source(); + header=&r.charsets.client(); + } else { + header=render=&charsets.get(oo.encoding->change_case(r.charsets.source(), String::CC_UPPER)); + } + const char* render_encoding=render->NAME_CSTR(); + const char* header_encoding=header->NAME_CSTR(); - // params - if(params->size()>1) { - Value& vparams=params->as_no_junction(1, "transform parameters parameter must not be code"); - if(vparams.is_defined()) - if(Hash *params=vparams.get_hash()) - params->for_each(add_xslt_param, &vdom.transformer()); - else - PTHROW(0, 0, - &method_name, - "transform parameters parameter must be hash"); + xmlCharEncodingHandler *renderer=xmlFindCharEncodingHandler(render_encoding); + // UTF-8 renderer contains empty input/output converters, + // which is wrong for xmlOutputBufferCreateIO + // while zero renderer goes perfectly + if(render->isUTF8()) + renderer=0; + + xmlOutputBuffer_auto_ptr outputBuffer(xmlAllocOutputBuffer(renderer)); + + xsltStylesheet_auto_ptr stylesheet(xsltNewStylesheet()); + if(!stylesheet.get()) + throw Exception(0, + 0, + "xsltNewStylesheet failed"); + + #define OOSTRING2STYLE(name) \ + stylesheet->name=oo.name?BAD_CAST xmlMemStrdup((const char*)r.transcode(*oo.name)):0 + #define OOBOOL2STYLE(name) \ + if(oo.name>=0) stylesheet->name=oo.name + + OOSTRING2STYLE(method); + OOSTRING2STYLE(encoding); + OOSTRING2STYLE(mediaType); +// OOSTRING2STYLE(doctypeSystem); +// OOSTRING2STYLE(doctypePublic); + OOBOOL2STYLE(indent); + OOSTRING2STYLE(version); + OOBOOL2STYLE(standalone); + OOBOOL2STYLE(omitXmlDeclaration); + + xmlDoc& xmldoc=vdoc.get_xmldoc(); + xmldoc.encoding=BAD_CAST xmlMemStrdup(render_encoding); + if(header_encoding) + stylesheet->encoding=BAD_CAST xmlMemStrdup(header_encoding); + if(xsltSaveResultTo(outputBuffer.get(), &xmldoc, stylesheet.get())<0 + || xmlHaveGenericErrors()) + throw XmlException(0, r); + + // write out result + char *gnome_str; + size_t gnome_length; +#ifdef LIBXML2_NEW_BUFFER + if(outputBuffer->conv) { + gnome_length=xmlBufUse(outputBuffer->conv); + gnome_str=(char *)xmlBufContent(outputBuffer->conv); + } else { + gnome_length=xmlOutputBufferGetSize(&(*outputBuffer)); + gnome_str=(char *)xmlOutputBufferGetContent(&(*outputBuffer)); } +#else + if(outputBuffer->conv) { + gnome_length=outputBuffer->conv->use; + gnome_str=(char *)outputBuffer->conv->content; + } else { + gnome_length=outputBuffer->buffer->use; + gnome_str=(char *)outputBuffer->buffer->content; + } +#endif + + if(file_spec){ + file_write(r.charsets, + *file_spec, + gnome_str, + gnome_length, + true/*as_text*/); + return String::C(); // actually, we don't need this output at all + } else + return String::C(gnome_length ? pa_strdup(gnome_str, gnome_length) : 0, gnome_length); +} + +inline HashStringValue* get_options(MethodParams& params, size_t index){ + return (params.count()>index) ? params.as_hash(index) : 0; +} + +static void _file(Request& r, MethodParams& params) { + VXdoc& vdoc=GET_SELF(r, VXdoc); + + XDocOutputOptions oo(vdoc.output_options); + oo.append(r, get_options(params, 0), true/* $.name[filename] could be specified by user */); + String::C buf=xdoc2buf(r, vdoc, oo, 0/*file_name. not to file, to memory*/); - // source - const XalanParsedSource &parsed_source=vdom.get_parsed_source(pool, &method_name); + VFile& vfile=*new VFile; + VHash& vhcontent_type=*new VHash; + vhcontent_type.hash().put(value_name, new VString(*oo.mediaType)); + vhcontent_type.hash().put("charset", new VString(*oo.encoding)); - // stylesheet - const String& stylesheet_file_name=params->as_string(0, "file name must not be code"); - const String& stylesheet_filespec=r.absolute(stylesheet_file_name); - //_asm int 3; - Stylesheet_connection& connection=XSLT_stylesheet_manager->get_connection(stylesheet_filespec); - - // target - XalanDocument* target=vdom.parser_liaison().createDocument(); - XSLTResultTarget domResultTarget(target); - - // transform - int error=vdom.transformer().transform( - parsed_source, - &connection.stylesheet(), - domResultTarget); - connection.close(); - if(error) - PTHROW(0, 0, - &stylesheet_file_name, - vdom.transformer().getLastError()); + vfile.set_binary(false/*not tainted*/, buf.str?buf.str:""/*to distinguish from stat-ed file*/, buf.length, oo.filename, &vhcontent_type); // write out result - VXdoc& result=*new(pool) VXdoc(pool); - result.set_document(*target); - r.write_no_lang(result); -} - -static void _getElementById(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXdoc& vdoc=*static_cast(r.self); - - // elementId - const char *elementId=params->as_string(0, "elementID must not be code").cstr(String::UL_AS_IS); - - if(XalanElement *element= - vdoc.get_document(pool, &method_name).getElementById(XalanDOMString(elementId))) { - // write out result - VXnode& result=*new(pool) VXnode(pool, element); - r.write_no_lang(result); - } + r.write_no_lang(vfile); } -static void _getElementsByTagName(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXdoc& vdoc=*static_cast(r.self); - - // tagname - const char *tagname=params->as_string(0, "tagname must not be code").cstr(String::UL_AS_IS); - - VHash& result=*new(pool) VHash(pool); - if(const XalanNodeList *nodes= - vdoc.get_document(pool, &method_name).getElementsByTagName(XalanDOMString(tagname))) { - for(int i=0; igetLength(); i++) { - String& skey=*new(pool) String(pool); - { - char *buf=(char *)pool.malloc(MAX_NUMBER); - snprintf(buf, MAX_NUMBER, "%d", i); - skey << buf; - } +static void _save(Request& r, MethodParams& params) { + VXdoc& vdoc=GET_SELF(r, VXdoc); - result.hash().put(skey, new(pool) VXnode(pool, nodes->item(i))); - } - } + const String& file_spec=r.absolute(params.as_string(0, FILE_NAME_MUST_BE_STRING)); + + XDocOutputOptions oo(vdoc.output_options); + oo.append(r, get_options(params, 1)); + xdoc2buf(r, vdoc, oo, &file_spec); +} + +static void _string(Request& r, MethodParams& params) { + VXdoc& vdoc=GET_SELF(r, VXdoc); + + XDocOutputOptions oo(vdoc.output_options); + oo.append(r, get_options(params, 0)); + String::C buf=xdoc2buf(r, vdoc, oo, + 0/*file_name. not to file, to memory*/, + true/*use source charset to render, client charset to put to header*/); // write out result - r.write_no_lang(result); + r.write_no_lang(String(buf, String::L_AS_IS)); } -static void _getElementsByTagNameNS(Request& r, const String& method_name, MethodParams *params) { - Pool& pool=r.pool(); - VXdoc& vdoc=*static_cast(r.self); - - // namespaceURI;localName - const char *namespaceURI=params->as_string(0, "namespaceURI must not be code").cstr(String::UL_AS_IS); - const char *localName=params->as_string(0, "localName must not be code").cstr(String::UL_AS_IS); - - VHash& result=*new(pool) VHash(pool); - if(const XalanNodeList *nodes= - vdoc.get_document(pool, &method_name).getElementsByTagNameNS( - XalanDOMString(namespaceURI), XalanDOMString(localName))) { - for(int i=0; igetLength(); i++) { - String& skey=*new(pool) String(pool); - { - char *buf=(char *)pool.malloc(MAX_NUMBER); - snprintf(buf, MAX_NUMBER, "%d", i); - skey << buf; - } +#ifndef DOXYGEN +struct Add_xslt_param_info { + Request* r; + Array* strings; + const xmlChar** current_transform_param; +}; +#endif +static void add_xslt_param( + HashStringValue::key_type attribute, + HashStringValue::value_type meaning, + Add_xslt_param_info* info) { + xmlChar* s; + *info->current_transform_param++=(s=info->r->transcode(attribute)); *info->strings+=s; + *info->current_transform_param++=(s=info->r->transcode(meaning->as_string())); *info->strings+=s; +} + +static VXdoc& _transform(Request& r, const String* stylesheet_source, + VXdoc& vdoc, xsltStylesheetPtr stylesheet, const xmlChar** transform_params) +{ + xmlDoc& xmldoc=vdoc.get_xmldoc(); + + xsltTransformContext_auto_ptr transformContext( + xsltNewTransformContext(stylesheet, &xmldoc)); + // make params literal + if (transformContext->globalVars == NULL) // strangly not initialized by xsltNewTransformContext + transformContext->globalVars = xmlHashCreate(20); + xsltQuoteUserParams(transformContext.get(), (const char**)transform_params); + // do transform + xmlDoc *transformed=xsltApplyStylesheetUser( + stylesheet, + &xmldoc, + 0/*already quoted-inserted transform_params*/, + 0/*const char* output*/, + 0/*FILE *profile*/, + transformContext.get()); + if(!transformed || xmlHaveGenericErrors()) + throw XmlException(stylesheet_source, r); + + //gdome_xml_doc_mkref dislikes XML_HTML_DOCUMENT_NODE type, fixing + transformed->type=XML_DOCUMENT_NODE; + // constructing result + VXdoc& result=*new VXdoc(r.charsets, *transformed); + /* grabbing options + + + */ + XDocOutputOptions& oo=result.output_options; + + oo.method=stylesheet->method?&r.transcode(stylesheet->method):0; + oo.encoding=stylesheet->encoding?&r.transcode(stylesheet->encoding):0; + oo.mediaType=stylesheet->mediaType?&r.transcode(stylesheet->mediaType):0; + oo.indent=stylesheet->indent; + oo.version=stylesheet->version?&r.transcode(stylesheet->version):0; + oo.standalone=stylesheet->standalone; + oo.omitXmlDeclaration=stylesheet->omitXmlDeclaration; - result.hash().put(skey, new(pool) VXnode(pool, nodes->item(i))); + // return + return result; +} +static void _transform(Request& r, MethodParams& params) { + VXdoc& vdoc=GET_SELF(r, VXdoc); + + // params + Array transform_strings; + const xmlChar** transform_params=0; + if(params.count()>1) + if(HashStringValue* hash=params.as_hash(1, "transform options")) { + transform_params=new const xmlChar*[hash->count()*2+1]; + Add_xslt_param_info info={ + &r, + &transform_strings, + transform_params + }; + hash->for_each(add_xslt_param, &info); + transform_params[hash->count()*2]=0; } + + VXdoc* result; + if(Value *vxdoc=params[0].as(VXDOC_TYPE)) { // stylesheet (xdoc) + xmlDoc& stylesheetdoc=static_cast(vxdoc)->get_xmldoc(); + // compile xdoc stylesheet + xsltStylesheet_auto_ptr stylesheet_ptr(xsltParseStylesheetDoc(&stylesheetdoc)); + if(xmlHaveGenericErrors()) + throw XmlException(0, r); + if(!stylesheet_ptr.get()) + throw Exception("xml", + 0, + "stylesheet failed to compile"); + // strange thing - xsltParseStylesheetDoc records document and destroys it in stylesheet destructor + // we don't need that + stylesheet_ptr->doc=0; + + // transform! + result=&_transform(r, 0, + vdoc, stylesheet_ptr.get(), + transform_params); + } else { // stylesheet (file name) + // extablish stylesheet connection + const String& stylesheet_filespec= + r.absolute(params.as_string(0, "stylesheet must be file name (string) or DOM document (xdoc)")); + Stylesheet_connection_ptr connection=stylesheet_manager->get_connection(stylesheet_filespec); + + // load and compile file to stylesheet [or get cached if any] + // transform! + result=&_transform(r, &stylesheet_filespec, vdoc, connection->stylesheet(), + transform_params); } // write out result - r.write_no_lang(result); + r.write_no_lang(*result); } // constructor -MXdoc::MXdoc(Pool& apool) : MXnode(apool) { - set_name(*NEW String(pool(), XDOC_CLASS_NAME)); +/// @test how to create empty type html? +MXdoc::MXdoc(): MXnode(XDOC_CLASS_NAME) { + set_base(xnode_class); + + /// DOM1 + + // Element createElement(in DOMString tagName) raises(DOMException); + add_native_method("createElement", Method::CT_DYNAMIC, _createElement, 1, 1); + // DocumentFragment createDocumentFragment(); + add_native_method("createDocumentFragment", Method::CT_DYNAMIC, _createDocumentFragment, 0, 0); + // Text createTextNode(in DOMString data); + add_native_method("createTextNode", Method::CT_DYNAMIC, _createTextNode, 1, 1); + // Comment createComment(in DOMString data); + add_native_method("createComment", Method::CT_DYNAMIC, _createComment, 1, 1); + // CDATASection createCDATASection(in DOMString data) raises(DOMException); + add_native_method("createCDATASection", Method::CT_DYNAMIC, _createCDATASection, 1, 1); + // ProcessingInstruction createProcessingInstruction(in DOMString target, in DOMString data) raises(DOMException); + add_native_method("createProcessingInstruction", Method::CT_DYNAMIC, _createProcessingInstruction, 2, 2); + // Attr createAttribute(in DOMString name) raises(DOMException); + add_native_method("createAttribute", Method::CT_DYNAMIC, _createAttribute, 1, 1); + // EntityReference createEntityReference(in DOMString name) raises(DOMException); + add_native_method("createEntityReference", Method::CT_DYNAMIC, _createEntityReference, 1, 1); + + /// DOM2 + + // ^xdoc.getElementById[elementId] + add_native_method("getElementById", Method::CT_DYNAMIC, _getElementById, 1, 1); + + // Node (in Node importedNode, in boolean deep) raises(DOMException) + add_native_method("importNode", Method::CT_DYNAMIC, _importNode, 2, 2); + + // Attr createAttributeNS(in DOMString namespaceURI, in DOMString qualifiedName) raises(DOMException); + add_native_method("createAttributeNS", Method::CT_DYNAMIC, _createAttributeNS, 2, 2); + + // Element createElementNS(in DOMString namespaceURI, in DOMString qualifiedName) raises(DOMException); + add_native_method("createElementNS", Method::CT_DYNAMIC, _createElementNS, 2, 2); + + /// parser + + // ^xdoc::create{qualifiedName} + // ^xdoc::create[xml] + // ^xdoc::create[URI][xml] + add_native_method("create", Method::CT_DYNAMIC, _create, 1, 2); + // for backward compatibility with <=v 1.82 2002/01/31 11:51:46 paf + add_native_method("set", Method::CT_DYNAMIC, _create, 1, 1); + + // ^xdoc::load[some.xml] + add_native_method("load", Method::CT_DYNAMIC, _load, 1, 1); // ^xdoc.save[some.xml] // ^xdoc.save[some.xml;options hash] @@ -417,40 +782,18 @@ MXdoc::MXdoc(Pool& apool) : MXnode(apool // ^xdoc.file[options hash] file with "" add_native_method("file", Method::CT_DYNAMIC, _file, 0, 1); - // ^xdoc::set[xml] - add_native_method("set", Method::CT_DYNAMIC, _set, 1, 1); - - // ^xdoc::load[some.xml] - add_native_method("load", Method::CT_DYNAMIC, _load, 1, 1); + // ^xdoc.transform[stylesheet file_name/xdoc] + // ^xdoc.transform[stylesheet file_name/xdoc;params hash] + add_native_method("transform", Method::CT_DYNAMIC, _transform, 1, 2); - // ^xdoc.xslt[stylesheet file_name] - // ^xdoc.xslt[stylesheet file_name;params hash] - add_native_method("xslt", Method::CT_DYNAMIC, _xslt, 1, 2); +} - // ^xdoc.getElementById[elementId] - add_native_method("getElementById", Method::CT_DYNAMIC, _getElementById, 1, 1); - - // ^xdoc.getElementById[tagname] - add_native_method("getElementsByTagName", Method::CT_DYNAMIC, _getElementsByTagName, 1, 1); +# else - // ^xdoc.getElementsByTagNameNS[namespaceURI;localName] = array of nodes - add_native_method("getElementsByTagNameNS", Method::CT_DYNAMIC, _getElementsByTagNameNS, 2, 2); +#include "classes.h" -} // global variable -Methoded *Xdoc_class; - -// creator - -#endif +DECLARE_CLASS_VAR(xdoc, 0); // fictive -Methoded *MXdoc_create(Pool& pool) { - return -#ifdef XML - Xdoc_class=new(pool) MXdoc(pool); -#else - 0 #endif - ; -}