12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207120812091210121112121213121412151216121712181219122012211222122312241225122612271228122912301231123212331234123512361237123812391240124112421243124412451246124712481249125012511252125312541255125612571258125912601261126212631264126512661267126812691270127112721273127412751276127
7127812791280128112821283128412851286128712881289129012911292129312941295129612971298129913001301130213031304130513061307130813091310131113121313131413151316131713181319132013211322132313241325132613271328132913301331133213331334133513361337133813391340134113421343134413451346134713481349135013511352135313541355135613571358135913601361136213631364136513661367136813691370137113721373137413751376137713781379138013811382138313841385138613871388138913901391139213931394139513961397139813991400140114021403140414051406140714081409141014111412141314141415141614171418141914201421142214231424142514261427142814291430143114321433143414351436143714381439144014411442144314441445144614471448144914501451145214531454145514561457145814591460146114621463146414651466146714681469147014711472147314741475147614771478147914801481148214831484148514861487148814891490149114921493149414951496149714981499150015011502150315041505150615071508150915101511151215131514151515161517151815191520152115221523152415251526152715281529153015311532153315341535153615371538153915401541154215431544154515461547154815491550155115521553155415551556155715581559156015611562156315641565156615671568156915701571157215731574157515761577157815791580158115821583158415851586158715881589159015911592159315941595159615971598159916001601160216031604160516061607160816091610161116121613161416151616161716181619162016211622162316241625162616271628162916301631163216331634163516361637163816391640164116421643164416451646164716481649165016511652165316541655165616571658165916601661166216631664166516661667166816691670167116721673167416751676167716781679168016811682168316841685168616871688168916901691169216931694169516961697169816991700170117021703170417051706170717081709171017111712171317141715171617171718171917201721172217231724172517261727172817291730173117321733173417351736173717381739174017411742174317441745174617471748 |
- /*
- +----------------------------------------------------------------------+
- | PHP Version 5 |
- +----------------------------------------------------------------------+
- | Copyright (c) 1997-2016 The PHP Group |
- +----------------------------------------------------------------------+
- | This source file is subject to version 3.01 of the PHP license, |
- | that is bundled with this package in the file LICENSE, and is |
- | available through the world-wide-web at the following url: |
- | http://www.php.net/license/3_01.txt |
- | If you did not receive a copy of the PHP license and are unable to |
- | obtain it through the world-wide-web, please send a note to |
- | license@php.net so we can mail you a copy immediately. |
- +----------------------------------------------------------------------+
- | Authors: Stig Sæther Bakken <ssb@php.net> |
- | Thies C. Arntzen <thies@thieso.net> |
- | Sterling Hughes <sterling@php.net> |
- +----------------------------------------------------------------------+
- */
- /* $Id$ */
- #define IS_EXT_MODULE
- #ifdef HAVE_CONFIG_H
- #include "config.h"
- #endif
- #include "php.h"
- #define PHP_XML_INTERNAL
- #include "zend_variables.h"
- #include "ext/standard/php_string.h"
- #include "ext/standard/info.h"
- #include "ext/standard/html.h"
- #if HAVE_XML
- #include "php_xml.h"
- # include "ext/standard/head.h"
- #ifdef LIBXML_EXPAT_COMPAT
- #include "ext/libxml/php_libxml.h"
- #endif
- /* Short-term TODO list:
- * - Implement XML_ExternalEntityParserCreate()
- * - XML_SetCommentHandler
- * - XML_SetCdataSectionHandler
- * - XML_SetParamEntityParsing
- */
- /* Long-term TODO list:
- * - Fix the expat library so you can install your own memory manager
- * functions
- */
- /* Known bugs:
- * - Weird things happen with <![CDATA[]]> sections.
- */
- ZEND_DECLARE_MODULE_GLOBALS(xml) /* storage for the xml module globals initialised by PHP_GINIT_FUNCTION(xml) */
- /* {{{ dynamically loadable module stuff
- * ZEND_GET_MODULE(xml) is only emitted when COMPILE_DL_XML is defined.
- */
- #ifdef COMPILE_DL_XML
- ZEND_GET_MODULE(xml)
- #endif /* COMPILE_DL_XML */
- /* }}} */
- #define SKIP_TAGSTART(str) ((str) + (parser->toffset > strlen(str) ? strlen(str) : parser->toffset)) /* Yields str advanced by parser->toffset bytes, or by strlen(str) when toffset is larger.
- * Relies on a variable named `parser` being in scope at the expansion site, and
- * evaluates its argument more than once, so only pass side-effect-free expressions.
- */
- /* {{{ function prototypes
- * Forward declarations for the module hooks, the internal helpers and the
- * parser callback functions (_xml_*Handler), so they can be referenced
- * before their definitions appear.
- */
- PHP_MINIT_FUNCTION(xml);
- PHP_MINFO_FUNCTION(xml);
- static PHP_GINIT_FUNCTION(xml);
- static void xml_parser_dtor(zend_rsrc_list_entry *rsrc TSRMLS_DC);
- static void xml_set_handler(zval **, zval **);
- inline static unsigned short xml_encode_iso_8859_1(unsigned char);
- inline static char xml_decode_iso_8859_1(unsigned short);
- inline static unsigned short xml_encode_us_ascii(unsigned char);
- inline static char xml_decode_us_ascii(unsigned short);
- static zval *xml_call_handler(xml_parser *, zval *, zend_function *, int, zval **);
- static zval *_xml_xmlchar_zval(const XML_Char *, int, const XML_Char *);
- static int _xml_xmlcharlen(const XML_Char *);
- static void _xml_add_to_info(xml_parser *parser,char *name);
- inline static char *_xml_decode_tag(xml_parser *parser, const char *tag);
- void _xml_startElementHandler(void *, const XML_Char *, const XML_Char **);
- void _xml_endElementHandler(void *, const XML_Char *);
- void _xml_characterDataHandler(void *, const XML_Char *, int);
- void _xml_processingInstructionHandler(void *, const XML_Char *, const XML_Char *);
- void _xml_defaultHandler(void *, const XML_Char *, int);
- void _xml_unparsedEntityDeclHandler(void *, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *);
- void _xml_notationDeclHandler(void *, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *);
- int _xml_externalEntityRefHandler(XML_Parser, const XML_Char *, const XML_Char *, const XML_Char *, const XML_Char *);
- void _xml_startNamespaceDeclHandler(void *, const XML_Char *, const XML_Char *);
- void _xml_endNamespaceDeclHandler(void *, const XML_Char *);
- /* }}} */
- /* {{{ extension definition structures
- * Argument metadata for every function exported in xml_functions[].
- * In ZEND_BEGIN_ARG_INFO_EX() the last argument is the number of required
- * parameters; in ZEND_ARG_INFO() the first argument is 1 for parameters that
- * are passed by reference (obj, values, index) and 0 otherwise.
- */
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parser_create, 0, 0, 0)
- ZEND_ARG_INFO(0, encoding)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parser_create_ns, 0, 0, 0)
- ZEND_ARG_INFO(0, encoding)
- ZEND_ARG_INFO(0, sep)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_object, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(1, obj)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_element_handler, 0, 0, 3)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, shdl)
- ZEND_ARG_INFO(0, ehdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_character_data_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_processing_instruction_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_default_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_unparsed_entity_decl_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_notation_decl_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_external_entity_ref_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_start_namespace_decl_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_set_end_namespace_decl_handler, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, hdl)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parse, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, data)
- ZEND_ARG_INFO(0, isfinal)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parse_into_struct, 0, 0, 3)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, data)
- ZEND_ARG_INFO(1, values)
- ZEND_ARG_INFO(1, index)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_get_error_code, 0, 0, 1)
- ZEND_ARG_INFO(0, parser)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_error_string, 0, 0, 1)
- ZEND_ARG_INFO(0, code)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_get_current_line_number, 0, 0, 1)
- ZEND_ARG_INFO(0, parser)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_get_current_column_number, 0, 0, 1)
- ZEND_ARG_INFO(0, parser)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_get_current_byte_index, 0, 0, 1)
- ZEND_ARG_INFO(0, parser)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parser_free, 0, 0, 1)
- ZEND_ARG_INFO(0, parser)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parser_set_option, 0, 0, 3)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, option)
- ZEND_ARG_INFO(0, value)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_xml_parser_get_option, 0, 0, 2)
- ZEND_ARG_INFO(0, parser)
- ZEND_ARG_INFO(0, option)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_utf8_encode, 0, 0, 1)
- ZEND_ARG_INFO(0, data)
- ZEND_END_ARG_INFO()
- ZEND_BEGIN_ARG_INFO_EX(arginfo_utf8_decode, 0, 0, 1)
- ZEND_ARG_INFO(0, data)
- ZEND_END_ARG_INFO()
- const zend_function_entry xml_functions[] = { /* exported PHP functions, each paired with its arginfo table; PHP_FE_END terminates the list */
- PHP_FE(xml_parser_create, arginfo_xml_parser_create)
- PHP_FE(xml_parser_create_ns, arginfo_xml_parser_create_ns)
- PHP_FE(xml_set_object, arginfo_xml_set_object)
- PHP_FE(xml_set_element_handler, arginfo_xml_set_element_handler)
- PHP_FE(xml_set_character_data_handler, arginfo_xml_set_character_data_handler)
- PHP_FE(xml_set_processing_instruction_handler, arginfo_xml_set_processing_instruction_handler)
- PHP_FE(xml_set_default_handler, arginfo_xml_set_default_handler)
- PHP_FE(xml_set_unparsed_entity_decl_handler,arginfo_xml_set_unparsed_entity_decl_handler)
- PHP_FE(xml_set_notation_decl_handler, arginfo_xml_set_notation_decl_handler)
- PHP_FE(xml_set_external_entity_ref_handler, arginfo_xml_set_external_entity_ref_handler)
- PHP_FE(xml_set_start_namespace_decl_handler,arginfo_xml_set_start_namespace_decl_handler)
- PHP_FE(xml_set_end_namespace_decl_handler, arginfo_xml_set_end_namespace_decl_handler)
- PHP_FE(xml_parse, arginfo_xml_parse)
- PHP_FE(xml_parse_into_struct, arginfo_xml_parse_into_struct)
- PHP_FE(xml_get_error_code, arginfo_xml_get_error_code)
- PHP_FE(xml_error_string, arginfo_xml_error_string)
- PHP_FE(xml_get_current_line_number, arginfo_xml_get_current_line_number)
- PHP_FE(xml_get_current_column_number, arginfo_xml_get_current_column_number)
- PHP_FE(xml_get_current_byte_index, arginfo_xml_get_current_byte_index)
- PHP_FE(xml_parser_free, arginfo_xml_parser_free)
- PHP_FE(xml_parser_set_option, arginfo_xml_parser_set_option)
- PHP_FE(xml_parser_get_option, arginfo_xml_parser_get_option)
- PHP_FE(utf8_encode, arginfo_utf8_encode)
- PHP_FE(utf8_decode, arginfo_utf8_decode)
- PHP_FE_END
- };
- #ifdef LIBXML_EXPAT_COMPAT
- static const zend_module_dep xml_deps[] = { /* only built with LIBXML_EXPAT_COMPAT: declares the libxml extension as required */
- ZEND_MOD_REQUIRED("libxml")
- ZEND_MOD_END
- };
- #endif
- zend_module_entry xml_module_entry = { /* module descriptor: name, function table and lifecycle hooks of the xml extension */
- #ifdef LIBXML_EXPAT_COMPAT
- STANDARD_MODULE_HEADER_EX, NULL,
- xml_deps,
- #else
- STANDARD_MODULE_HEADER,
- #endif
- "xml", /* extension name */
- xml_functions, /* extension function list */
- PHP_MINIT(xml), /* extension-wide startup function */
- NULL, /* extension-wide shutdown function */
- NULL, /* per-request startup function */
- NULL, /* per-request shutdown function */
- PHP_MINFO(xml), /* information function */
- NO_VERSION_YET,
- PHP_MODULE_GLOBALS(xml), /* globals descriptor */
- PHP_GINIT(xml), /* globals ctor */
- NULL, /* globals dtor */
- NULL, /* post deactivate */
- STANDARD_MODULE_PROPERTIES_EX
- };
- /* Table of supported encodings; each entry is { name, decoder, encoder }.
- * ISO-8859-1 and US-ASCII carry conversion callbacks. UTF-8 has none (NULL),
- * which xml_utf8_encode() and xml_utf8_decode() treat as "copy the data as-is".
- * The entry with a NULL name terminates the table (see xml_get_encoding()).
- */
- xml_encoding xml_encodings[] = {
- { (XML_Char *)"ISO-8859-1", xml_decode_iso_8859_1, xml_encode_iso_8859_1 },
- { (XML_Char *)"US-ASCII", xml_decode_us_ascii, xml_encode_us_ascii },
- { (XML_Char *)"UTF-8", NULL, NULL },
- { (XML_Char *)NULL, NULL, NULL }
- };
- static XML_Memory_Handling_Suite php_xml_mem_hdlrs; /* filled in by PHP_MINIT_FUNCTION(xml) with the php_xml_*_wrapper allocators */
- /* True globals, no need for thread safety */
- static int le_xml_parser; /* resource type id obtained from zend_register_list_destructors_ex() in PHP_MINIT_FUNCTION(xml) */
- /* }}} */
- /* {{{ startup, shutdown and info functions */
- static PHP_GINIT_FUNCTION(xml)
- {
- xml_globals->default_encoding = "UTF-8";
- }
/* Allocation callback installed as php_xml_mem_hdlrs.malloc_fcn; forwards
 * the request for sz bytes to emalloc() and returns its result. */
static void *php_xml_malloc_wrapper(size_t sz)
{
	void *block = emalloc(sz);

	return block;
}
/* Reallocation callback installed as php_xml_mem_hdlrs.realloc_fcn; forwards
 * ptr and the new size sz to erealloc() and returns its result. */
static void *php_xml_realloc_wrapper(void *ptr, size_t sz)
{
	void *resized = erealloc(ptr, sz);

	return resized;
}
/* Deallocation callback installed as php_xml_mem_hdlrs.free_fcn.
 * A NULL pointer is ignored; anything else is handed to efree(). */
static void php_xml_free_wrapper(void *ptr)
{
	if (ptr == NULL) {
		return;
	}

	efree(ptr);
}
- PHP_MINIT_FUNCTION(xml) /* Module startup: registers the parser resource type, the XML_* constants and the allocator wrappers; always returns SUCCESS. */
- {
- le_xml_parser = zend_register_list_destructors_ex(xml_parser_dtor, NULL, "xml", module_number); /* xml_parser_dtor() releases parser resources of this type */
- REGISTER_LONG_CONSTANT("XML_ERROR_NONE", XML_ERROR_NONE, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_NO_MEMORY", XML_ERROR_NO_MEMORY, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_SYNTAX", XML_ERROR_SYNTAX, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_NO_ELEMENTS", XML_ERROR_NO_ELEMENTS, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_INVALID_TOKEN", XML_ERROR_INVALID_TOKEN, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_UNCLOSED_TOKEN", XML_ERROR_UNCLOSED_TOKEN, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_PARTIAL_CHAR", XML_ERROR_PARTIAL_CHAR, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_TAG_MISMATCH", XML_ERROR_TAG_MISMATCH, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_DUPLICATE_ATTRIBUTE", XML_ERROR_DUPLICATE_ATTRIBUTE, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_JUNK_AFTER_DOC_ELEMENT", XML_ERROR_JUNK_AFTER_DOC_ELEMENT, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_PARAM_ENTITY_REF", XML_ERROR_PARAM_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_UNDEFINED_ENTITY", XML_ERROR_UNDEFINED_ENTITY, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_RECURSIVE_ENTITY_REF", XML_ERROR_RECURSIVE_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_ASYNC_ENTITY", XML_ERROR_ASYNC_ENTITY, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_BAD_CHAR_REF", XML_ERROR_BAD_CHAR_REF, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_BINARY_ENTITY_REF", XML_ERROR_BINARY_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF", XML_ERROR_ATTRIBUTE_EXTERNAL_ENTITY_REF, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_MISPLACED_XML_PI", XML_ERROR_MISPLACED_XML_PI, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_UNKNOWN_ENCODING", XML_ERROR_UNKNOWN_ENCODING, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_INCORRECT_ENCODING", XML_ERROR_INCORRECT_ENCODING, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_UNCLOSED_CDATA_SECTION", XML_ERROR_UNCLOSED_CDATA_SECTION, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_ERROR_EXTERNAL_ENTITY_HANDLING", XML_ERROR_EXTERNAL_ENTITY_HANDLING, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_OPTION_CASE_FOLDING", PHP_XML_OPTION_CASE_FOLDING, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_OPTION_TARGET_ENCODING", PHP_XML_OPTION_TARGET_ENCODING, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_OPTION_SKIP_TAGSTART", PHP_XML_OPTION_SKIP_TAGSTART, CONST_CS|CONST_PERSISTENT);
- REGISTER_LONG_CONSTANT("XML_OPTION_SKIP_WHITE", PHP_XML_OPTION_SKIP_WHITE, CONST_CS|CONST_PERSISTENT);
- /* this object should not be pre-initialised at compile time,
- as the order of members may vary */
- php_xml_mem_hdlrs.malloc_fcn = php_xml_malloc_wrapper;
- php_xml_mem_hdlrs.realloc_fcn = php_xml_realloc_wrapper;
- php_xml_mem_hdlrs.free_fcn = php_xml_free_wrapper;
- #ifdef LIBXML_EXPAT_COMPAT
- REGISTER_STRING_CONSTANT("XML_SAX_IMPL", "libxml", CONST_CS|CONST_PERSISTENT);
- #else
- REGISTER_STRING_CONSTANT("XML_SAX_IMPL", "expat", CONST_CS|CONST_PERSISTENT);
- #endif
- return SUCCESS;
- }
- PHP_MINFO_FUNCTION(xml) /* Prints the extension's info table: XML and namespace support plus the backing library version. */
- {
- php_info_print_table_start();
- php_info_print_table_row(2, "XML Support", "active");
- php_info_print_table_row(2, "XML Namespace Support", "active");
- #if defined(LIBXML_DOTTED_VERSION) && defined(LIBXML_EXPAT_COMPAT)
- php_info_print_table_row(2, "libxml2 Version", LIBXML_DOTTED_VERSION);
- #else
- php_info_print_table_row(2, "EXPAT Version", XML_ExpatVersion());
- #endif
- php_info_print_table_end();
- }
- /* }}} */
- /* {{{ extension-internal functions */
- static zval *_xml_resource_zval(long value)
- {
- zval *ret;
- TSRMLS_FETCH();
- MAKE_STD_ZVAL(ret);
- Z_TYPE_P(ret) = IS_RESOURCE;
- Z_LVAL_P(ret) = value;
- zend_list_addref(value);
- return ret;
- }
- static zval *_xml_string_zval(const char *str)
- {
- zval *ret;
- int len = strlen(str);
- MAKE_STD_ZVAL(ret);
- Z_TYPE_P(ret) = IS_STRING;
- Z_STRLEN_P(ret) = len;
- Z_STRVAL_P(ret) = estrndup(str, len);
- return ret;
- }
- static zval *_xml_xmlchar_zval(const XML_Char *s, int len, const XML_Char *encoding)
- {
- zval *ret;
- MAKE_STD_ZVAL(ret);
- if (s == NULL) {
- ZVAL_FALSE(ret);
- return ret;
- }
- if (len == 0) {
- len = _xml_xmlcharlen(s);
- }
- Z_TYPE_P(ret) = IS_STRING;
- Z_STRVAL_P(ret) = xml_utf8_decode(s, len, &Z_STRLEN_P(ret), encoding);
- return ret;
- }
- /* }}} */
- /* {{{ xml_parser_dtor() */
- static void xml_parser_dtor(zend_rsrc_list_entry *rsrc TSRMLS_DC)
- {
- xml_parser *parser = (xml_parser *)rsrc->ptr;
- if (parser->parser) {
- XML_ParserFree(parser->parser);
- }
- if (parser->ltags) {
- int inx;
- for (inx = 0; ((inx < parser->level) && (inx < XML_MAXLEVEL)); inx++)
- efree(parser->ltags[ inx ]);
- efree(parser->ltags);
- }
- if (parser->startElementHandler) {
- zval_ptr_dtor(&parser->startElementHandler);
- }
- if (parser->endElementHandler) {
- zval_ptr_dtor(&parser->endElementHandler);
- }
- if (parser->characterDataHandler) {
- zval_ptr_dtor(&parser->characterDataHandler);
- }
- if (parser->processingInstructionHandler) {
- zval_ptr_dtor(&parser->processingInstructionHandler);
- }
- if (parser->defaultHandler) {
- zval_ptr_dtor(&parser->defaultHandler);
- }
- if (parser->unparsedEntityDeclHandler) {
- zval_ptr_dtor(&parser->unparsedEntityDeclHandler);
- }
- if (parser->notationDeclHandler) {
- zval_ptr_dtor(&parser->notationDeclHandler);
- }
- if (parser->externalEntityRefHandler) {
- zval_ptr_dtor(&parser->externalEntityRefHandler);
- }
- if (parser->unknownEncodingHandler) {
- zval_ptr_dtor(&parser->unknownEncodingHandler);
- }
- if (parser->startNamespaceDeclHandler) {
- zval_ptr_dtor(&parser->startNamespaceDeclHandler);
- }
- if (parser->endNamespaceDeclHandler) {
- zval_ptr_dtor(&parser->endNamespaceDeclHandler);
- }
- if (parser->baseURI) {
- efree(parser->baseURI);
- }
- if (parser->object) {
- zval_ptr_dtor(&parser->object);
- }
- efree(parser);
- }
- /* }}} */
- /* {{{ xml_set_handler() */
- static void xml_set_handler(zval **handler, zval **data)
- {
- /* If we have already a handler, release it */
- if (*handler) {
- zval_ptr_dtor(handler);
- }
- /* IS_ARRAY might indicate that we're using array($obj, 'method') syntax */
- if (Z_TYPE_PP(data) != IS_ARRAY && Z_TYPE_PP(data) != IS_OBJECT) {
- convert_to_string_ex(data);
- if (Z_STRLEN_PP(data) == 0) {
- *handler = NULL;
- return;
- }
- }
- zval_add_ref(data);
- *handler = *data;
- }
- /* }}} */
- /* {{{ xml_call_handler() */
- static zval *xml_call_handler(xml_parser *parser, zval *handler, zend_function *function_ptr, int argc, zval **argv)
- {
- int i;
- TSRMLS_FETCH();
- if (parser && handler && !EG(exception)) {
- zval ***args;
- zval *retval;
- int result;
- zend_fcall_info fci;
- args = safe_emalloc(sizeof(zval **), argc, 0);
- for (i = 0; i < argc; i++) {
- args[i] = &argv[i];
- }
- fci.size = sizeof(fci);
- fci.function_table = EG(function_table);
- fci.function_name = handler;
- fci.symbol_table = NULL;
- fci.object_ptr = parser->object;
- fci.retval_ptr_ptr = &retval;
- fci.param_count = argc;
- fci.params = args;
- fci.no_separation = 0;
- /*fci.function_handler_cache = &function_ptr;*/
- result = zend_call_function(&fci, NULL TSRMLS_CC);
- if (result == FAILURE) {
- zval **method;
- zval **obj;
- if (Z_TYPE_P(handler) == IS_STRING) {
- php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unable to call handler %s()", Z_STRVAL_P(handler));
- } else if (Z_TYPE_P(handler) == IS_ARRAY &&
- zend_hash_index_find(Z_ARRVAL_P(handler), 0, (void **) &obj) == SUCCESS &&
- zend_hash_index_find(Z_ARRVAL_P(handler), 1, (void **) &method) == SUCCESS &&
- Z_TYPE_PP(obj) == IS_OBJECT &&
- Z_TYPE_PP(method) == IS_STRING) {
- php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unable to call handler %s::%s()", Z_OBJCE_PP(obj)->name, Z_STRVAL_PP(method));
- } else
- php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unable to call handler");
- }
- for (i = 0; i < argc; i++) {
- zval_ptr_dtor(args[i]);
- }
- efree(args);
- if (result == FAILURE) {
- return NULL;
- } else {
- return EG(exception) ? NULL : retval;
- }
- } else {
- for (i = 0; i < argc; i++) {
- zval_ptr_dtor(&argv[i]);
- }
- return NULL;
- }
- }
- /* }}} */
/* {{{ xml_encode_iso_8859_1() */
/* Maps an ISO-8859-1 byte to its code point: the byte value itself,
 * widened to unsigned short. */
inline static unsigned short xml_encode_iso_8859_1(unsigned char c)
{
	unsigned short code_point = c;

	return code_point;
}
/* }}} */
/* {{{ xml_decode_iso_8859_1() */
/* Maps a code point to an ISO-8859-1 byte; anything above 0xff has no
 * representation and becomes '?'. */
inline static char xml_decode_iso_8859_1(unsigned short c)
{
	if (c > 0xff) {
		return '?';
	}

	return (char) c;
}
/* }}} */
/* {{{ xml_encode_us_ascii() */
/* Maps a US-ASCII byte to its code point: the byte value itself, widened
 * to unsigned short. Values above 0x7f are passed through unchanged. */
inline static unsigned short xml_encode_us_ascii(unsigned char c)
{
	unsigned short code_point = c;

	return code_point;
}
/* }}} */
/* {{{ xml_decode_us_ascii() */
/* Maps a code point to a US-ASCII byte; anything above 0x7f has no
 * representation and becomes '?'. */
inline static char xml_decode_us_ascii(unsigned short c)
{
	if (c > 0x7f) {
		return '?';
	}

	return (char) c;
}
/* }}} */
- /* {{{ xml_get_encoding() */
- static xml_encoding *xml_get_encoding(const XML_Char *name)
- {
- xml_encoding *enc = &xml_encodings[0];
- while (enc && enc->name) {
- if (strcasecmp(name, enc->name) == 0) {
- return enc;
- }
- enc++;
- }
- return NULL;
- }
- /* }}} */
- /* {{{ xml_utf8_encode */
- PHPAPI char *xml_utf8_encode(const char *s, int len, int *newlen, const XML_Char *encoding)
- {
- int pos = len;
- char *newbuf;
- unsigned int c;
- unsigned short (*encoder)(unsigned char) = NULL;
- xml_encoding *enc = xml_get_encoding(encoding);
- *newlen = 0;
- if (enc) {
- encoder = enc->encoding_function;
- } else {
- /* If the target encoding was unknown, fail */
- return NULL;
- }
- if (encoder == NULL) {
- /* If no encoder function was specified, return the data as-is.
- */
- newbuf = emalloc(len + 1);
- memcpy(newbuf, s, len);
- *newlen = len;
- newbuf[*newlen] = '\0';
- return newbuf;
- }
- /* This is the theoretical max (will never get beyond len * 2 as long
- * as we are converting from single-byte characters, though) */
- newbuf = safe_emalloc_string(len, 4, 1);
- while (pos > 0) {
- c = encoder ? encoder((unsigned char)(*s)) : (unsigned short)(*s);
- if (c < 0x80) {
- newbuf[(*newlen)++] = (char) c;
- } else if (c < 0x800) {
- newbuf[(*newlen)++] = (0xc0 | (c >> 6));
- newbuf[(*newlen)++] = (0x80 | (c & 0x3f));
- } else if (c < 0x10000) {
- newbuf[(*newlen)++] = (0xe0 | (c >> 12));
- newbuf[(*newlen)++] = (0xc0 | ((c >> 6) & 0x3f));
- newbuf[(*newlen)++] = (0x80 | (c & 0x3f));
- } else if (c < 0x200000) {
- newbuf[(*newlen)++] = (0xf0 | (c >> 18));
- newbuf[(*newlen)++] = (0xe0 | ((c >> 12) & 0x3f));
- newbuf[(*newlen)++] = (0xc0 | ((c >> 6) & 0x3f));
- newbuf[(*newlen)++] = (0x80 | (c & 0x3f));
- }
- pos--;
- s++;
- }
- newbuf[*newlen] = 0;
- newbuf = erealloc(newbuf, (*newlen)+1);
- return newbuf;
- }
- /* }}} */
- /* {{{ xml_utf8_decode */
- PHPAPI char *xml_utf8_decode(const XML_Char *s, int len, int *newlen, const XML_Char *encoding)
- {
- size_t pos = 0;
- char *newbuf = emalloc(len + 1);
- unsigned int c;
- char (*decoder)(unsigned short) = NULL;
- xml_encoding *enc = xml_get_encoding(encoding);
- *newlen = 0;
- if (enc) {
- decoder = enc->decoding_function;
- }
- if (decoder == NULL) {
- /* If the target encoding was unknown, or no decoder function
- * was specified, return the UTF-8-encoded data as-is.
- */
- memcpy(newbuf, s, len);
- *newlen = len;
- newbuf[*newlen] = '\0';
- return newbuf;
- }
- while (pos < (size_t)len) {
- int status = FAILURE;
- c = php_next_utf8_char((const unsigned char*)s, (size_t) len, &pos, &status);
- if (status == FAILURE || c > 0xFFU) {
- c = '?';
- }
- newbuf[*newlen] = decoder ? decoder(c) : c;
- ++*newlen;
- }
- if (*newlen < len) {
- newbuf = erealloc(newbuf, *newlen + 1);
- }
- newbuf[*newlen] = '\0';
- return newbuf;
- }
- /* }}} */
- /* {{{ _xml_xmlcharlen() */
- static int _xml_xmlcharlen(const XML_Char *s)
- {
- int len = 0;
- while (*s) {
- len++;
- s++;
- }
- return len;
- }
- /* }}} */
- /* {{{ _xml_zval_strdup() */
- PHPAPI char *_xml_zval_strdup(zval *val)
- {
- if (Z_TYPE_P(val) == IS_STRING) {
- char *buf = emalloc(Z_STRLEN_P(val) + 1);
- memcpy(buf, Z_STRVAL_P(val), Z_STRLEN_P(val));
- buf[Z_STRLEN_P(val)] = '\0';
- return buf;
- }
- return NULL;
- }
- /* }}} */
- /* {{{ _xml_add_to_info */
- static void _xml_add_to_info(xml_parser *parser,char *name)
- {
- zval **element, *values;
- if (! parser->info) {
- return;
- }
- if (zend_hash_find(Z_ARRVAL_P(parser->info),name,strlen(name) + 1,(void **) &element) == FAILURE) {
- MAKE_STD_ZVAL(values);
- array_init(values);
- zend_hash_update(Z_ARRVAL_P(parser->info), name, strlen(name)+1, (void *) &values, sizeof(zval*), (void **) &element);
- }
- add_next_index_long(*element,parser->curtag);
- parser->curtag++;
- }
- /* }}} */
- /* {{{ _xml_decode_tag() */
- static char *_xml_decode_tag(xml_parser *parser, const char *tag)
- {
- char *newstr;
- int out_len;
- newstr = xml_utf8_decode(tag, strlen(tag), &out_len, parser->target_encoding);
- if (parser->case_folding) {
- php_strtoupper(newstr, out_len);
- }
- return newstr;
- }
- /* }}} */
- /* {{{ _xml_startElementHandler() */
- void _xml_startElementHandler(void *userData, const XML_Char *name, const XML_Char **attributes)
- {
- xml_parser *parser = (xml_parser *)userData;
- const char **attrs = (const char **) attributes;
- char *tag_name;
- char *att, *val;
- int val_len;
- zval *retval, *args[3];
- if (parser) {
- parser->level++;
- tag_name = _xml_decode_tag(parser, name);
- if (parser->startElementHandler) {
- args[0] = _xml_resource_zval(parser->index);
- args[1] = _xml_string_zval(SKIP_TAGSTART((char *) tag_name));
- MAKE_STD_ZVAL(args[2]);
- array_init(args[2]);
- while (attributes && *attributes) {
- att = _xml_decode_tag(parser, attributes[0]);
- val = xml_utf8_decode(attributes[1], strlen(attributes[1]), &val_len, parser->target_encoding);
- add_assoc_stringl(args[2], att, val, val_len, 0);
- attributes += 2;
- efree(att);
- }
- if ((retval = xml_call_handler(parser, parser->startElementHandler, parser->startElementPtr, 3, args))) {
- zval_ptr_dtor(&retval);
- }
- }
- if (parser->data) {
- if (parser->level <= XML_MAXLEVEL) {
- zval *tag, *atr;
- int atcnt = 0;
- MAKE_STD_ZVAL(tag);
- MAKE_STD_ZVAL(atr);
- array_init(tag);
- array_init(atr);
- _xml_add_to_info(parser,SKIP_TAGSTART((char *) tag_name));
- add_assoc_string(tag,"tag",SKIP_TAGSTART((char *) tag_name),1);
- add_assoc_string(tag,"type","open",1);
- add_assoc_long(tag,"level",parser->level);
- parser->ltags[parser->level-1] = estrdup(tag_name);
- parser->lastwasopen = 1;
- attributes = (const XML_Char **) attrs;
- while (attributes && *attributes) {
- att = _xml_decode_tag(parser, attributes[0]);
- val = xml_utf8_decode(attributes[1], strlen(attributes[1]), &val_len, parser->target_encoding);
- add_assoc_stringl(atr,att,val,val_len,0);
- atcnt++;
- attributes += 2;
- efree(att);
- }
- if (atcnt) {
- zend_hash_add(Z_ARRVAL_P(tag),"attributes",sizeof("attributes"),&atr,sizeof(zval*),NULL);
- } else {
- zval_ptr_dtor(&atr);
- }
- zend_hash_next_index_insert(Z_ARRVAL_P(parser->data),&tag,sizeof(zval*),(void *) &parser->ctag);
- } else if (parser->level == (XML_MAXLEVEL + 1)) {
- TSRMLS_FETCH();
- php_error_docref(NULL TSRMLS_CC, E_WARNING, "Maximum depth exceeded - Results truncated");
- }
- }
- efree(tag_name);
- }
- }
- /* }}} */
- /* {{{ _xml_endElementHandler()
-    Expat end-tag callback. Invokes the userland end-element handler (if one is
-    registered) and, while a struct array is being filled (parser->data set),
-    either marks the tag opened last as "complete" or appends a "close" entry.
-    Finally releases the tag name stored for this level and decrements the
-    nesting level. */
- void _xml_endElementHandler(void *userData, const XML_Char *name)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	char *tag_name;
- 	zval *retval, *args[2];
- 	if (!parser) {
- 		return;
- 	}
- 	tag_name = _xml_decode_tag(parser, name);
- 	if (parser->endElementHandler) {
- 		args[0] = _xml_resource_zval(parser->index);
- 		args[1] = _xml_string_zval(SKIP_TAGSTART((char *) tag_name));
- 		retval = xml_call_handler(parser, parser->endElementHandler, parser->endElementPtr, 2, args);
- 		if (retval) {
- 			zval_ptr_dtor(&retval);
- 		}
- 	}
- 	if (parser->data) {
- 		if (!parser->lastwasopen) {
- 			/* Something was emitted since the opening tag: record an explicit close entry. */
- 			zval *tag;
- 			MAKE_STD_ZVAL(tag);
- 			array_init(tag);
- 			_xml_add_to_info(parser,SKIP_TAGSTART((char *) tag_name));
- 			add_assoc_string(tag,"tag",SKIP_TAGSTART((char *) tag_name),1);
- 			add_assoc_string(tag,"type","close",1);
- 			add_assoc_long(tag,"level",parser->level);
- 			zend_hash_next_index_insert(Z_ARRVAL_P(parser->data),&tag,sizeof(zval*),NULL);
- 		} else {
- 			/* The previous event was this element's opening tag: retag that entry. */
- 			add_assoc_string(*(parser->ctag),"type","complete",1);
- 		}
- 		parser->lastwasopen = 0;
- 	}
- 	efree(tag_name);
- 	/* Tag names are only stored for levels up to XML_MAXLEVEL. */
- 	if (parser->ltags && parser->level <= XML_MAXLEVEL) {
- 		efree(parser->ltags[parser->level-1]);
- 	}
- 	parser->level--;
- }
- /* }}} */
- /* {{{ _xml_characterDataHandler()
-    Expat character-data callback. Passes the text to the userland handler (if
-    one is registered) and, while a struct array is being filled (parser->data
-    set), stores the decoded text either as the "value" of the tag opened last
-    or as a "cdata" entry, merging consecutive chunks into one value. Text made
-    only of spaces, tabs and newlines is dropped when parser->skipwhite is set. */
- /* Appends decoded_len bytes of decoded_value to the string zval *value and
-    frees decoded_value. memcpy plus an explicit terminator keeps the buffer
-    in step with the stored length. */
- static void _xml_append_decoded_value(zval **value, char *decoded_value, int decoded_len)
- {
- 	int oldlen = Z_STRLEN_PP(value);
- 	int newlen = oldlen + decoded_len;
- 	Z_STRVAL_PP(value) = erealloc(Z_STRVAL_PP(value), newlen + 1);
- 	memcpy(Z_STRVAL_PP(value) + oldlen, decoded_value, decoded_len);
- 	Z_STRVAL_PP(value)[newlen] = '\0';
- 	Z_STRLEN_PP(value) = newlen;
- 	efree(decoded_value);
- }
- void _xml_characterDataHandler(void *userData, const XML_Char *s, int len)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	if (parser) {
- 		zval *retval, *args[2];
- 		if (parser->characterDataHandler) {
- 			args[0] = _xml_resource_zval(parser->index);
- 			args[1] = _xml_xmlchar_zval(s, len, parser->target_encoding);
- 			if ((retval = xml_call_handler(parser, parser->characterDataHandler, parser->characterDataPtr, 2, args))) {
- 				zval_ptr_dtor(&retval);
- 			}
- 		}
- 		if (parser->data) {
- 			int i;
- 			int doprint = 0;
- 			char *decoded_value;
- 			int decoded_len;
- 			decoded_value = xml_utf8_decode(s,len,&decoded_len,parser->target_encoding);
- 			/* doprint becomes 1 as soon as a byte other than space, tab or newline is seen. */
- 			for (i = 0; i < decoded_len && !doprint; i++) {
- 				char c = decoded_value[i];
- 				if (c != ' ' && c != '\t' && c != '\n') {
- 					doprint = 1;
- 				}
- 			}
- 			if (!doprint && parser->skipwhite) {
- 				/* Whitespace-only chunk and the caller asked to skip it. */
- 				efree(decoded_value);
- 				return;
- 			}
- 			if (parser->lastwasopen) {
- 				zval **myval;
- 				/* check if the current tag already has a value - if yes append to that! */
- 				if (zend_hash_find(Z_ARRVAL_PP(parser->ctag),"value",sizeof("value"),(void **) &myval) == SUCCESS) {
- 					_xml_append_decoded_value(myval, decoded_value, decoded_len);
- 				} else {
- 					/* The array takes ownership of decoded_value (no duplication). */
- 					add_assoc_string(*(parser->ctag),"value",decoded_value,0);
- 				}
- 			} else {
- 				zval *tag;
- 				zval **curtag, **mytype, **myval;
- 				HashPosition hpos=NULL;
- 				/* If the most recent entry is already a "cdata" entry with a value, extend it. */
- 				zend_hash_internal_pointer_end_ex(Z_ARRVAL_P(parser->data), &hpos);
- 				if (hpos && (zend_hash_get_current_data_ex(Z_ARRVAL_P(parser->data), (void **) &curtag, &hpos) == SUCCESS)) {
- 					if (zend_hash_find(Z_ARRVAL_PP(curtag),"type",sizeof("type"),(void **) &mytype) == SUCCESS) {
- 						if (!strcmp(Z_STRVAL_PP(mytype), "cdata")) {
- 							if (zend_hash_find(Z_ARRVAL_PP(curtag),"value",sizeof("value"),(void **) &myval) == SUCCESS) {
- 								_xml_append_decoded_value(myval, decoded_value, decoded_len);
- 								return;
- 							}
- 						}
- 					}
- 				}
- 				if (parser->level <= XML_MAXLEVEL && parser->level > 0) {
- 					MAKE_STD_ZVAL(tag);
- 					array_init(tag);
- 					_xml_add_to_info(parser,SKIP_TAGSTART(parser->ltags[parser->level-1]));
- 					add_assoc_string(tag,"tag",SKIP_TAGSTART(parser->ltags[parser->level-1]),1);
- 					add_assoc_string(tag,"value",decoded_value,0);
- 					add_assoc_string(tag,"type","cdata",1);
- 					add_assoc_long(tag,"level",parser->level);
- 					zend_hash_next_index_insert(Z_ARRVAL_P(parser->data),&tag,sizeof(zval*),NULL);
- 				} else {
- 					/* Nothing stores the text on this path, so release it here;
- 					   previously it was leaked. */
- 					efree(decoded_value);
- 					if (parser->level == (XML_MAXLEVEL + 1)) {
- 						TSRMLS_FETCH();
- 						php_error_docref(NULL TSRMLS_CC, E_WARNING, "Maximum depth exceeded - Results truncated");
- 					}
- 				}
- 			}
- 		}
- 	}
- }
- /* }}} */
- /* {{{ _xml_processingInstructionHandler()
-    Expat callback for processing instructions: hands the parser resource, the
-    PI target and the PI data to the registered userland handler and discards
-    whatever the handler returns. Does nothing when no handler is registered. */
- void _xml_processingInstructionHandler(void *userData, const XML_Char *target, const XML_Char *data)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	zval *retval, *args[3];
- 	if (!parser || !parser->processingInstructionHandler) {
- 		return;
- 	}
- 	args[0] = _xml_resource_zval(parser->index);
- 	args[1] = _xml_xmlchar_zval(target, 0, parser->target_encoding);
- 	args[2] = _xml_xmlchar_zval(data, 0, parser->target_encoding);
- 	retval = xml_call_handler(parser, parser->processingInstructionHandler, parser->processingInstructionPtr, 3, args);
- 	if (retval) {
- 		zval_ptr_dtor(&retval);
- 	}
- }
- /* }}} */
- /* {{{ _xml_defaultHandler()
-    Expat default callback: forwards the raw chunk (s, len) together with the
-    parser resource to the registered userland default handler and discards
-    the handler's return value. Does nothing when no handler is registered. */
- void _xml_defaultHandler(void *userData, const XML_Char *s, int len)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	zval *retval, *args[2];
- 	if (!parser || !parser->defaultHandler) {
- 		return;
- 	}
- 	args[0] = _xml_resource_zval(parser->index);
- 	args[1] = _xml_xmlchar_zval(s, len, parser->target_encoding);
- 	retval = xml_call_handler(parser, parser->defaultHandler, parser->defaultPtr, 2, args);
- 	if (retval) {
- 		zval_ptr_dtor(&retval);
- 	}
- }
- /* }}} */
- /* {{{ _xml_unparsedEntityDeclHandler()
-    Expat callback for unparsed entity declarations: passes the parser
-    resource followed by entity name, base, system id, public id and notation
-    name to the registered userland handler; the handler's result is dropped. */
- void _xml_unparsedEntityDeclHandler(void *userData,
- 	const XML_Char *entityName,
- 	const XML_Char *base,
- 	const XML_Char *systemId,
- 	const XML_Char *publicId,
- 	const XML_Char *notationName)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	zval *retval, *args[6];
- 	if (!parser || !parser->unparsedEntityDeclHandler) {
- 		return;
- 	}
- 	args[0] = _xml_resource_zval(parser->index);
- 	args[1] = _xml_xmlchar_zval(entityName, 0, parser->target_encoding);
- 	args[2] = _xml_xmlchar_zval(base, 0, parser->target_encoding);
- 	args[3] = _xml_xmlchar_zval(systemId, 0, parser->target_encoding);
- 	args[4] = _xml_xmlchar_zval(publicId, 0, parser->target_encoding);
- 	args[5] = _xml_xmlchar_zval(notationName, 0, parser->target_encoding);
- 	retval = xml_call_handler(parser, parser->unparsedEntityDeclHandler, parser->unparsedEntityDeclPtr, 6, args);
- 	if (retval) {
- 		zval_ptr_dtor(&retval);
- 	}
- }
- /* }}} */
- /* {{{ _xml_notationDeclHandler()
-    Expat callback for notation declarations: passes the parser resource
-    followed by notation name, base, system id and public id to the registered
-    userland handler; the handler's result is dropped. */
- void _xml_notationDeclHandler(void *userData,
- 	const XML_Char *notationName,
- 	const XML_Char *base,
- 	const XML_Char *systemId,
- 	const XML_Char *publicId)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	zval *retval, *args[5];
- 	if (!parser || !parser->notationDeclHandler) {
- 		return;
- 	}
- 	args[0] = _xml_resource_zval(parser->index);
- 	args[1] = _xml_xmlchar_zval(notationName, 0, parser->target_encoding);
- 	args[2] = _xml_xmlchar_zval(base, 0, parser->target_encoding);
- 	args[3] = _xml_xmlchar_zval(systemId, 0, parser->target_encoding);
- 	args[4] = _xml_xmlchar_zval(publicId, 0, parser->target_encoding);
- 	retval = xml_call_handler(parser, parser->notationDeclHandler, parser->notationDeclPtr, 5, args);
- 	if (retval) {
- 		zval_ptr_dtor(&retval);
- 	}
- }
- /* }}} */
- /* {{{ _xml_externalEntityRefHandler()
-    Expat callback for external entity references. Passes the parser resource
-    followed by the open entity names, base, system id and public id to the
-    registered userland handler and returns the handler's result converted to
-    an integer. Returns 0 when no handler is registered or the call yields no
-    value. */
- int _xml_externalEntityRefHandler(XML_Parser parserPtr,
- 	const XML_Char *openEntityNames,
- 	const XML_Char *base,
- 	const XML_Char *systemId,
- 	const XML_Char *publicId)
- {
- 	xml_parser *parser = XML_GetUserData(parserPtr);
- 	int ret = 0; /* abort if no handler is set (should be configurable?) */
- 	if (parser && parser->externalEntityRefHandler) {
- 		zval *retval, *args[5];
- 		args[0] = _xml_resource_zval(parser->index);
- 		args[1] = _xml_xmlchar_zval(openEntityNames, 0, parser->target_encoding);
- 		args[2] = _xml_xmlchar_zval(base, 0, parser->target_encoding);
- 		args[3] = _xml_xmlchar_zval(systemId, 0, parser->target_encoding);
- 		args[4] = _xml_xmlchar_zval(publicId, 0, parser->target_encoding);
- 		if ((retval = xml_call_handler(parser, parser->externalEntityRefHandler, parser->externalEntityRefPtr, 5, args))) {
- 			/* Separate before converting so a zval that is still referenced
- 			   elsewhere is not modified in place. */
- 			convert_to_long_ex(&retval);
- 			ret = Z_LVAL_P(retval);
- 			/* Release through the refcount-aware destructor, as every other
- 			   callback in this file does, rather than a raw efree(). */
- 			zval_ptr_dtor(&retval);
- 		}
- 	}
- 	return ret;
- }
- /* }}} */
- /* {{{ _xml_startNamespaceDeclHandler()
-    Expat callback fired when a namespace declaration starts: passes the parser
-    resource, the prefix and the URI to the registered userland handler and
-    discards the handler's return value. */
- void _xml_startNamespaceDeclHandler(void *userData,const XML_Char *prefix, const XML_Char *uri)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	zval *retval, *args[3];
- 	if (!parser || !parser->startNamespaceDeclHandler) {
- 		return;
- 	}
- 	args[0] = _xml_resource_zval(parser->index);
- 	args[1] = _xml_xmlchar_zval(prefix, 0, parser->target_encoding);
- 	args[2] = _xml_xmlchar_zval(uri, 0, parser->target_encoding);
- 	retval = xml_call_handler(parser, parser->startNamespaceDeclHandler, parser->startNamespaceDeclPtr, 3, args);
- 	if (retval) {
- 		zval_ptr_dtor(&retval);
- 	}
- }
- /* }}} */
- /* {{{ _xml_endNamespaceDeclHandler()
-    Expat callback fired when a namespace declaration ends: passes the parser
-    resource and the prefix to the registered userland handler and discards
-    the handler's return value. */
- void _xml_endNamespaceDeclHandler(void *userData, const XML_Char *prefix)
- {
- 	xml_parser *parser = (xml_parser *)userData;
- 	zval *retval, *args[2];
- 	if (!parser || !parser->endNamespaceDeclHandler) {
- 		return;
- 	}
- 	args[0] = _xml_resource_zval(parser->index);
- 	args[1] = _xml_xmlchar_zval(prefix, 0, parser->target_encoding);
- 	retval = xml_call_handler(parser, parser->endNamespaceDeclHandler, parser->endNamespaceDeclPtr, 2, args);
- 	if (retval) {
- 		zval_ptr_dtor(&retval);
- 	}
- }
- /* }}} */
- /************************* EXTENSION FUNCTIONS *************************/
- /* Shared implementation of xml_parser_create() and xml_parser_create_ns().
-    Parses the optional encoding argument (plus the optional separator when
-    ns_support is non-zero), creates the underlying parser and registers the
-    new xml_parser as a resource in return_value. Returns FALSE to userland on
-    bad arguments or an unsupported source encoding. */
- static void php_xml_parser_create_impl(INTERNAL_FUNCTION_PARAMETERS, int ns_support) /* {{{ */
- {
- 	xml_parser *parser;
- 	XML_Char *encoding;
- 	char *encoding_param = NULL;
- 	char *ns_param = NULL;
- 	int encoding_param_len = 0;
- 	int ns_param_len = 0;
- 	int auto_detect = 0;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, (ns_support ? "|ss": "|s"), &encoding_param, &encoding_param_len, &ns_param, &ns_param_len) == FAILURE) {
- 		RETURN_FALSE;
- 	}
- 	/* The supported encoding types are hardcoded here because
- 	 * we are limited to the encodings supported by expat/xmltok.
- 	 */
- 	if (encoding_param == NULL) {
- 		encoding = XML(default_encoding);
- 	} else if (encoding_param_len == 0) {
- 		/* Empty string: let the parser detect the source encoding itself. */
- 		encoding = XML(default_encoding);
- 		auto_detect = 1;
- 	} else if (!strcasecmp(encoding_param, "ISO-8859-1")) {
- 		encoding = "ISO-8859-1";
- 	} else if (!strcasecmp(encoding_param, "UTF-8")) {
- 		encoding = "UTF-8";
- 	} else if (!strcasecmp(encoding_param, "US-ASCII")) {
- 		encoding = "US-ASCII";
- 	} else {
- 		php_error_docref(NULL TSRMLS_CC, E_WARNING, "unsupported source encoding \"%s\"", encoding_param);
- 		RETURN_FALSE;
- 	}
- 	/* Namespace-aware parsers default to ":" as separator. */
- 	if (ns_param == NULL && ns_support) {
- 		ns_param = ":";
- 	}
- 	parser = ecalloc(1, sizeof(xml_parser));
- 	parser->parser = XML_ParserCreate_MM((auto_detect ? NULL : encoding),
- 		&php_xml_mem_hdlrs, ns_param);
- 	parser->target_encoding = encoding;
- 	parser->case_folding = 1;
- 	parser->object = NULL;
- 	parser->isparsing = 0;
- 	XML_SetUserData(parser->parser, parser);
- 	ZEND_REGISTER_RESOURCE(return_value, parser,le_xml_parser);
- 	/* Remember the resource id so callbacks can hand the resource to userland. */
- 	parser->index = Z_LVAL_P(return_value);
- }
- /* }}} */
- /* {{{ proto resource xml_parser_create([string encoding])
- Create an XML parser.
- Thin wrapper: forwards to php_xml_parser_create_impl() with ns_support = 0,
- so only the optional encoding argument is accepted. */
- PHP_FUNCTION(xml_parser_create)
- {
- php_xml_parser_create_impl(INTERNAL_FUNCTION_PARAM_PASSTHRU, 0);
- }
- /* }}} */
- /* {{{ proto resource xml_parser_create_ns([string encoding [, string sep]])
- Create an XML parser with namespace support.
- Thin wrapper: forwards to php_xml_parser_create_impl() with ns_support = 1,
- which also accepts the optional separator argument (":" when omitted). */
- PHP_FUNCTION(xml_parser_create_ns)
- {
- php_xml_parser_create_impl(INTERNAL_FUNCTION_PARAM_PASSTHRU, 1);
- }
- /* }}} */
- /* {{{ proto int xml_set_object(resource parser, object &obj)
- Set up object which should be used for callbacks.
- Releases any object stored earlier in parser->object, then allocates a new
- zval there and fills it from the passed object via MAKE_COPY_ZVAL.
- Returns true. */
- PHP_FUNCTION(xml_set_object)
- {
- xml_parser *parser;
- zval *pind, *mythis;
- if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "ro", &pind, &mythis) == FAILURE) {
- return;
- }
- ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
- /* Release the previously registered object before it is replaced.
- NOTE(review): the historical comment at this spot asked to keep this release
- commented out (contact: thies@thieso.net), yet the code is live - check the
- file history before changing it. */
- if (parser->object) {
- zval_ptr_dtor(&parser->object);
- }
- /* please leave this commented - or ask thies@thieso.net before doing it (again) */
- /* #ifdef ZEND_ENGINE_2
- zval_add_ref(&parser->object);
- #endif */
- ALLOC_ZVAL(parser->object);
- MAKE_COPY_ZVAL(&mythis, parser->object);
- RETVAL_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_element_handler(resource parser, string shdl, string ehdl)
-    Set up start and end element handlers.
-    Stores both userland callbacks on the parser and installs the C-level
-    start/end element callbacks on the underlying parser. Returns true. */
- PHP_FUNCTION(xml_set_element_handler)
- {
- 	zval *parser_zv;
- 	zval **start_hdl, **end_hdl;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZZ", &parser_zv, &start_hdl, &end_hdl) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->startElementHandler, start_hdl);
- 	xml_set_handler(&parser->endElementHandler, end_hdl);
- 	XML_SetElementHandler(parser->parser, _xml_startElementHandler, _xml_endElementHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_character_data_handler(resource parser, string hdl)
-    Set up character data handler.
-    Stores the userland callback on the parser and installs the C-level
-    character data callback on the underlying parser. Returns true. */
- PHP_FUNCTION(xml_set_character_data_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->characterDataHandler, handler);
- 	XML_SetCharacterDataHandler(parser->parser, _xml_characterDataHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_processing_instruction_handler(resource parser, string hdl)
-    Set up processing instruction (PI) handler.
-    Stores the userland callback on the parser and installs the C-level
-    processing instruction callback on the underlying parser. Returns true. */
- PHP_FUNCTION(xml_set_processing_instruction_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->processingInstructionHandler, handler);
- 	XML_SetProcessingInstructionHandler(parser->parser, _xml_processingInstructionHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_default_handler(resource parser, string hdl)
-    Set up default handler.
-    Stores the userland callback on the parser and installs the C-level
-    default callback on the underlying parser. Returns true. */
- PHP_FUNCTION(xml_set_default_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->defaultHandler, handler);
- 	XML_SetDefaultHandler(parser->parser, _xml_defaultHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_unparsed_entity_decl_handler(resource parser, string hdl)
-    Set up unparsed entity declaration handler.
-    Stores the userland callback on the parser and installs the C-level
-    unparsed entity declaration callback on the underlying parser.
-    Returns true. */
- PHP_FUNCTION(xml_set_unparsed_entity_decl_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->unparsedEntityDeclHandler, handler);
- 	XML_SetUnparsedEntityDeclHandler(parser->parser, _xml_unparsedEntityDeclHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_notation_decl_handler(resource parser, string hdl)
-    Set up notation declaration handler.
-    Stores the userland callback on the parser and installs the C-level
-    notation declaration callback on the underlying parser. Returns true. */
- PHP_FUNCTION(xml_set_notation_decl_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->notationDeclHandler, handler);
- 	XML_SetNotationDeclHandler(parser->parser, _xml_notationDeclHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_external_entity_ref_handler(resource parser, string hdl)
-    Set up external entity reference handler.
-    Stores the userland callback on the parser and installs the C-level
-    external entity reference callback on the underlying parser.
-    Returns true. */
- PHP_FUNCTION(xml_set_external_entity_ref_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->externalEntityRefHandler, handler);
- 	XML_SetExternalEntityRefHandler(parser->parser, (void *) _xml_externalEntityRefHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_start_namespace_decl_handler(resource parser, string hdl)
-    Set up start namespace declaration handler.
-    Stores the userland callback on the parser and installs the C-level
-    start-of-namespace-declaration callback on the underlying parser.
-    Returns true. */
- PHP_FUNCTION(xml_set_start_namespace_decl_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->startNamespaceDeclHandler, handler);
- 	XML_SetStartNamespaceDeclHandler(parser->parser, _xml_startNamespaceDeclHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_set_end_namespace_decl_handler(resource parser, string hdl)
-    Set up end namespace declaration handler.
-    Stores the userland callback on the parser and installs the C-level
-    end-of-namespace-declaration callback on the underlying parser.
-    Returns true. */
- PHP_FUNCTION(xml_set_end_namespace_decl_handler)
- {
- 	zval *parser_zv;
- 	zval **handler;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rZ", &parser_zv, &handler) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	xml_set_handler(&parser->endNamespaceDeclHandler, handler);
- 	XML_SetEndNamespaceDeclHandler(parser->parser, _xml_endNamespaceDeclHandler);
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_parse(resource parser, string data [, int isFinal])
-    Start parsing an XML document.
-    Feeds one chunk of data to the underlying parser and returns the parser's
-    integer result. parser->isparsing is raised for the duration of the call;
-    xml_parser_free() checks that flag. */
- PHP_FUNCTION(xml_parse)
- {
- 	zval *parser_zv;
- 	xml_parser *parser;
- 	char *chunk;
- 	int chunk_len;
- 	int status;
- 	long isFinal = 0;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rs|l", &parser_zv, &chunk, &chunk_len, &isFinal) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	parser->isparsing = 1;
- 	status = XML_Parse(parser->parser, chunk, chunk_len, isFinal);
- 	parser->isparsing = 0;
- 	RETURN_LONG(status);
- }
- /* }}} */
- /* {{{ proto int xml_parse_into_struct(resource parser, string data, array &values [, array &index ])
-    Parsing a XML document.
-    Resets "values" (and "index" when given) to empty arrays, points the parser
-    at them, installs the default, element and character data callbacks and
-    parses data as one final chunk. Returns the parser's integer result. */
- PHP_FUNCTION(xml_parse_into_struct)
- {
- 	xml_parser *parser;
- 	zval *pind, **xdata, **info = NULL;
- 	char *data;
- 	int data_len, ret;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rsZ|Z", &pind, &data, &data_len, &xdata, &info) == FAILURE) {
- 		return;
- 	}
- 	if (info) {
- 		zval_dtor(*info);
- 		array_init(*info);
- 	}
- 	ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
- 	zval_dtor(*xdata);
- 	array_init(*xdata);
- 	parser->data = *xdata;
- 	/* Always overwrite info: when the index array is omitted, a pointer left
- 	   over from an earlier call must not be written to again. */
- 	parser->info = info ? *info : NULL;
- 	/* A previous call may have left a tag-name stack behind. Free the names
- 	   still held (levels below the current one, capped at XML_MAXLEVEL) and
- 	   the array itself before allocating a fresh one. */
- 	if (parser->ltags) {
- 		int inx;
- 		for (inx = 0; inx < parser->level && inx < XML_MAXLEVEL; inx++) {
- 			efree(parser->ltags[inx]);
- 		}
- 		efree(parser->ltags);
- 	}
- 	parser->level = 0;
- 	parser->ltags = safe_emalloc(XML_MAXLEVEL, sizeof(char *), 0);
- 	XML_SetDefaultHandler(parser->parser, _xml_defaultHandler);
- 	XML_SetElementHandler(parser->parser, _xml_startElementHandler, _xml_endElementHandler);
- 	XML_SetCharacterDataHandler(parser->parser, _xml_characterDataHandler);
- 	parser->isparsing = 1;
- 	ret = XML_Parse(parser->parser, data, data_len, 1);
- 	parser->isparsing = 0;
- 	RETVAL_LONG(ret);
- }
- /* }}} */
- /* {{{ proto int xml_get_error_code(resource parser)
-    Get XML parser error code.
-    Returns the value of XML_GetErrorCode() for the underlying parser. */
- PHP_FUNCTION(xml_get_error_code)
- {
- 	zval *parser_zv;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "r", &parser_zv) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	RETURN_LONG((long)XML_GetErrorCode(parser->parser));
- }
- /* }}} */
- /* {{{ proto string xml_error_string(int code)
-    Get XML parser error string.
-    Returns a copy of the text XML_ErrorString() yields for code; when that
-    call yields no text, the return value is left untouched. */
- PHP_FUNCTION(xml_error_string)
- {
- 	long code;
- 	char *message;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "l", &code) == FAILURE) {
- 		return;
- 	}
- 	message = (char *)XML_ErrorString((int)code);
- 	if (message != NULL) {
- 		RETURN_STRING(message, 1);
- 	}
- }
- /* }}} */
- /* {{{ proto int xml_get_current_line_number(resource parser)
-    Get current line number for an XML parser.
-    Returns the value of XML_GetCurrentLineNumber() for the underlying parser. */
- PHP_FUNCTION(xml_get_current_line_number)
- {
- 	zval *parser_zv;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "r", &parser_zv) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	RETURN_LONG(XML_GetCurrentLineNumber(parser->parser));
- }
- /* }}} */
- /* {{{ proto int xml_get_current_column_number(resource parser)
-    Get current column number for an XML parser.
-    Returns the value of XML_GetCurrentColumnNumber() for the underlying parser. */
- PHP_FUNCTION(xml_get_current_column_number)
- {
- 	zval *parser_zv;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "r", &parser_zv) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	RETURN_LONG(XML_GetCurrentColumnNumber(parser->parser));
- }
- /* }}} */
- /* {{{ proto int xml_get_current_byte_index(resource parser)
-    Get current byte index for an XML parser.
-    Returns the value of XML_GetCurrentByteIndex() for the underlying parser. */
- PHP_FUNCTION(xml_get_current_byte_index)
- {
- 	zval *parser_zv;
- 	xml_parser *parser;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "r", &parser_zv) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	RETURN_LONG(XML_GetCurrentByteIndex(parser->parser));
- }
- /* }}} */
- /* {{{ proto int xml_parser_free(resource parser)
-    Free an XML parser.
-    Refuses with a warning and returns false while the parser is in the middle
-    of a parse call; otherwise removes the resource from the resource list and
-    returns true, or false when that removal fails. */
- PHP_FUNCTION(xml_parser_free)
- {
- 	zval *parser_zv;
- 	xml_parser *parser;
- 	int status;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "r", &parser_zv) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	if (parser->isparsing == 1) {
- 		php_error_docref(NULL TSRMLS_CC, E_WARNING, "Parser cannot be freed while it is parsing.");
- 		RETURN_FALSE;
- 	}
- 	status = zend_list_delete(parser->index);
- 	if (status == FAILURE) {
- 		RETURN_FALSE;
- 	}
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_parser_set_option(resource parser, int option, mixed value)
-    Set options in an XML parser.
-    Handles case folding, tag-start skipping (negative values are reset to 0
-    with a notice), whitespace skipping and the target encoding. Returns true
-    on success, false with a warning for an unknown option or an unsupported
-    target encoding. */
- PHP_FUNCTION(xml_parser_set_option)
- {
- 	zval *parser_zv;
- 	zval **val;
- 	xml_parser *parser;
- 	long opt;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rlZ", &parser_zv, &opt, &val) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser, xml_parser *, &parser_zv, -1, "XML Parser", le_xml_parser);
- 	if (opt == PHP_XML_OPTION_CASE_FOLDING) {
- 		convert_to_long_ex(val);
- 		parser->case_folding = Z_LVAL_PP(val);
- 	} else if (opt == PHP_XML_OPTION_SKIP_TAGSTART) {
- 		convert_to_long_ex(val);
- 		parser->toffset = Z_LVAL_PP(val);
- 		if (parser->toffset < 0) {
- 			php_error_docref(NULL TSRMLS_CC, E_NOTICE, "tagstart ignored, because it is out of range");
- 			parser->toffset = 0;
- 		}
- 	} else if (opt == PHP_XML_OPTION_SKIP_WHITE) {
- 		convert_to_long_ex(val);
- 		parser->skipwhite = Z_LVAL_PP(val);
- 	} else if (opt == PHP_XML_OPTION_TARGET_ENCODING) {
- 		xml_encoding *enc;
- 		convert_to_string_ex(val);
- 		enc = xml_get_encoding(Z_STRVAL_PP(val));
- 		if (enc == NULL) {
- 			php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unsupported target encoding \"%s\"", Z_STRVAL_PP(val));
- 			RETURN_FALSE;
- 		}
- 		/* Keep the name owned by the encoding table entry, not the caller's string. */
- 		parser->target_encoding = enc->name;
- 	} else {
- 		php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unknown option");
- 		RETURN_FALSE;
- 	}
- 	RETURN_TRUE;
- }
- /* }}} */
- /* {{{ proto int xml_parser_get_option(resource parser, int option)
-    Get options from an XML parser.
-    Reports every option xml_parser_set_option() can store: case folding,
-    tag-start skip offset and whitespace skipping as integers, the target
-    encoding as a string. Unknown options raise a warning and return false. */
- PHP_FUNCTION(xml_parser_get_option)
- {
- 	xml_parser *parser;
- 	zval *pind;
- 	long opt;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "rl", &pind, &opt) == FAILURE) {
- 		return;
- 	}
- 	ZEND_FETCH_RESOURCE(parser,xml_parser *, &pind, -1, "XML Parser", le_xml_parser);
- 	/* Every case leaves the function through a RETURN_* macro. */
- 	switch (opt) {
- 		case PHP_XML_OPTION_CASE_FOLDING:
- 			RETURN_LONG(parser->case_folding);
- 			break;
- 		case PHP_XML_OPTION_SKIP_TAGSTART:
- 			RETURN_LONG(parser->toffset);
- 			break;
- 		case PHP_XML_OPTION_SKIP_WHITE:
- 			RETURN_LONG(parser->skipwhite);
- 			break;
- 		case PHP_XML_OPTION_TARGET_ENCODING:
- 			RETURN_STRING(parser->target_encoding, 1);
- 			break;
- 		default:
- 			php_error_docref(NULL TSRMLS_CC, E_WARNING, "Unknown option");
- 			RETURN_FALSE;
- 			break;
- 	}
- }
- /* }}} */
- /* {{{ proto string utf8_encode(string data)
-    Encodes an ISO-8859-1 string to UTF-8.
-    Returns the encoded string, handing the freshly produced buffer to the
-    return value without copying, or false when the encoder yields nothing. */
- PHP_FUNCTION(utf8_encode)
- {
- 	char *input;
- 	int input_len;
- 	XML_Char *encoded;
- 	int encoded_len;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s", &input, &input_len) == FAILURE) {
- 		return;
- 	}
- 	encoded = xml_utf8_encode(input, input_len, &encoded_len, "ISO-8859-1");
- 	if (!encoded) {
- 		RETURN_FALSE;
- 	}
- 	RETURN_STRINGL(encoded, encoded_len, 0);
- }
- /* }}} */
- /* {{{ proto string utf8_decode(string data)
-    Converts a UTF-8 encoded string to ISO-8859-1.
-    Returns the decoded string, handing the freshly produced buffer to the
-    return value without copying, or false when the decoder yields nothing. */
- PHP_FUNCTION(utf8_decode)
- {
- 	char *input;
- 	int input_len;
- 	XML_Char *decoded;
- 	int decoded_len;
- 	if (zend_parse_parameters(ZEND_NUM_ARGS() TSRMLS_CC, "s", &input, &input_len) == FAILURE) {
- 		return;
- 	}
- 	decoded = xml_utf8_decode(input, input_len, &decoded_len, "ISO-8859-1");
- 	if (!decoded) {
- 		RETURN_FALSE;
- 	}
- 	RETURN_STRINGL(decoded, decoded_len, 0);
- }
- /* }}} */
- #endif
- /*
- * Local variables:
- * tab-width: 4
- * c-basic-offset: 4
- * End:
- * vim600: sw=4 ts=4 fdm=marker
- * vim<600: sw=4 ts=4
- */
|