php_xml.c 7.6 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329
  1. /*
  2. +----------------------------------------------------------------------+
  3. | PHP Version 7 |
  4. +----------------------------------------------------------------------+
  5. | Copyright (c) 1997-2018 The PHP Group |
  6. +----------------------------------------------------------------------+
  7. | This source file is subject to version 3.01 of the PHP license, |
  8. | that is bundled with this package in the file LICENSE, and is |
  9. | available through the world-wide-web at the following url: |
  10. | http://www.php.net/license/3_01.txt |
  11. | If you did not receive a copy of the PHP license and are unable to |
  12. | obtain it through the world-wide-web, please send a note to |
  13. | license@php.net so we can mail you a copy immediately. |
  14. +----------------------------------------------------------------------+
  15. | Authors: Brad Lafountain <rodif_bl@yahoo.com> |
  16. | Shane Caraveo <shane@caraveo.com> |
  17. | Dmitry Stogov <dmitry@php.net> |
  18. +----------------------------------------------------------------------+
  19. */
  20. #include "php_soap.h"
  21. #include "ext/libxml/php_libxml.h"
  22. #include "libxml/parser.h"
  23. #include "libxml/parserInternals.h"
  24. /* Channel libxml file io layer through the PHP streams subsystem.
  25. * This allows use of ftps:// and https:// urls */
  26. static int is_blank(const xmlChar* str)
  27. {
  28. while (*str != '\0') {
  29. if (*str != ' ' && *str != 0x9 && *str != 0xa && *str != 0xd) {
  30. return 0;
  31. }
  32. str++;
  33. }
  34. return 1;
  35. }
  36. /* removes all empty text, comments and other insignoficant nodes */
  37. static void cleanup_xml_node(xmlNodePtr node)
  38. {
  39. xmlNodePtr trav;
  40. xmlNodePtr del = NULL;
  41. trav = node->children;
  42. while (trav != NULL) {
  43. if (del != NULL) {
  44. xmlUnlinkNode(del);
  45. xmlFreeNode(del);
  46. del = NULL;
  47. }
  48. if (trav->type == XML_TEXT_NODE) {
  49. if (is_blank(trav->content)) {
  50. del = trav;
  51. }
  52. } else if ((trav->type != XML_ELEMENT_NODE) &&
  53. (trav->type != XML_CDATA_SECTION_NODE)) {
  54. del = trav;
  55. } else if (trav->children != NULL) {
  56. cleanup_xml_node(trav);
  57. }
  58. trav = trav->next;
  59. }
  60. if (del != NULL) {
  61. xmlUnlinkNode(del);
  62. xmlFreeNode(del);
  63. }
  64. }
  65. static void soap_ignorableWhitespace(void *ctx, const xmlChar *ch, int len)
  66. {
  67. }
  68. static void soap_Comment(void *ctx, const xmlChar *value)
  69. {
  70. }
  71. xmlDocPtr soap_xmlParseFile(const char *filename)
  72. {
  73. xmlParserCtxtPtr ctxt = NULL;
  74. xmlDocPtr ret;
  75. zend_bool old_allow_url_fopen;
  76. /*
  77. xmlInitParser();
  78. */
  79. old_allow_url_fopen = PG(allow_url_fopen);
  80. PG(allow_url_fopen) = 1;
  81. ctxt = xmlCreateFileParserCtxt(filename);
  82. PG(allow_url_fopen) = old_allow_url_fopen;
  83. if (ctxt) {
  84. zend_bool old;
  85. ctxt->keepBlanks = 0;
  86. ctxt->sax->ignorableWhitespace = soap_ignorableWhitespace;
  87. ctxt->sax->comment = soap_Comment;
  88. ctxt->sax->warning = NULL;
  89. ctxt->sax->error = NULL;
  90. /*ctxt->sax->fatalError = NULL;*/
  91. #if LIBXML_VERSION >= 20703
  92. ctxt->options |= XML_PARSE_HUGE;
  93. #endif
  94. old = php_libxml_disable_entity_loader(1);
  95. xmlParseDocument(ctxt);
  96. php_libxml_disable_entity_loader(old);
  97. if (ctxt->wellFormed) {
  98. ret = ctxt->myDoc;
  99. if (ret->URL == NULL && ctxt->directory != NULL) {
  100. ret->URL = xmlCharStrdup(ctxt->directory);
  101. }
  102. } else {
  103. ret = NULL;
  104. xmlFreeDoc(ctxt->myDoc);
  105. ctxt->myDoc = NULL;
  106. }
  107. xmlFreeParserCtxt(ctxt);
  108. } else {
  109. ret = NULL;
  110. }
  111. /*
  112. xmlCleanupParser();
  113. */
  114. if (ret) {
  115. cleanup_xml_node((xmlNodePtr)ret);
  116. }
  117. return ret;
  118. }
  119. xmlDocPtr soap_xmlParseMemory(const void *buf, size_t buf_size)
  120. {
  121. xmlParserCtxtPtr ctxt = NULL;
  122. xmlDocPtr ret;
  123. /*
  124. xmlInitParser();
  125. */
  126. ctxt = xmlCreateMemoryParserCtxt(buf, buf_size);
  127. if (ctxt) {
  128. zend_bool old;
  129. ctxt->sax->ignorableWhitespace = soap_ignorableWhitespace;
  130. ctxt->sax->comment = soap_Comment;
  131. ctxt->sax->warning = NULL;
  132. ctxt->sax->error = NULL;
  133. /*ctxt->sax->fatalError = NULL;*/
  134. #if LIBXML_VERSION >= 20703
  135. ctxt->options |= XML_PARSE_HUGE;
  136. #endif
  137. old = php_libxml_disable_entity_loader(1);
  138. xmlParseDocument(ctxt);
  139. php_libxml_disable_entity_loader(old);
  140. if (ctxt->wellFormed) {
  141. ret = ctxt->myDoc;
  142. if (ret->URL == NULL && ctxt->directory != NULL) {
  143. ret->URL = xmlCharStrdup(ctxt->directory);
  144. }
  145. } else {
  146. ret = NULL;
  147. xmlFreeDoc(ctxt->myDoc);
  148. ctxt->myDoc = NULL;
  149. }
  150. xmlFreeParserCtxt(ctxt);
  151. } else {
  152. ret = NULL;
  153. }
  154. /*
  155. xmlCleanupParser();
  156. */
  157. /*
  158. if (ret) {
  159. cleanup_xml_node((xmlNodePtr)ret);
  160. }
  161. */
  162. return ret;
  163. }
  164. xmlNsPtr attr_find_ns(xmlAttrPtr node)
  165. {
  166. if (node->ns) {
  167. return node->ns;
  168. } else if (node->parent->ns) {
  169. return node->parent->ns;
  170. } else {
  171. return xmlSearchNs(node->doc, node->parent, NULL);
  172. }
  173. }
  174. xmlNsPtr node_find_ns(xmlNodePtr node)
  175. {
  176. if (node->ns) {
  177. return node->ns;
  178. } else {
  179. return xmlSearchNs(node->doc, node, NULL);
  180. }
  181. }
  182. int attr_is_equal_ex(xmlAttrPtr node, char *name, char *ns)
  183. {
  184. if (name == NULL || ((node->name) && strcmp((char*)node->name, name) == 0)) {
  185. if (ns) {
  186. xmlNsPtr nsPtr = attr_find_ns(node);
  187. if (nsPtr) {
  188. return (strcmp((char*)nsPtr->href, ns) == 0);
  189. } else {
  190. return FALSE;
  191. }
  192. }
  193. return TRUE;
  194. }
  195. return FALSE;
  196. }
  197. int node_is_equal_ex(xmlNodePtr node, char *name, char *ns)
  198. {
  199. if (name == NULL || ((node->name) && strcmp((char*)node->name, name) == 0)) {
  200. if (ns) {
  201. xmlNsPtr nsPtr = node_find_ns(node);
  202. if (nsPtr) {
  203. return (strcmp((char*)nsPtr->href, ns) == 0);
  204. } else {
  205. return FALSE;
  206. }
  207. }
  208. return TRUE;
  209. }
  210. return FALSE;
  211. }
  212. xmlAttrPtr get_attribute_ex(xmlAttrPtr node, char *name, char *ns)
  213. {
  214. while (node!=NULL) {
  215. if (attr_is_equal_ex(node, name, ns)) {
  216. return node;
  217. }
  218. node = node->next;
  219. }
  220. return NULL;
  221. }
  222. xmlNodePtr get_node_ex(xmlNodePtr node, char *name, char *ns)
  223. {
  224. while (node!=NULL) {
  225. if (node_is_equal_ex(node, name, ns)) {
  226. return node;
  227. }
  228. node = node->next;
  229. }
  230. return NULL;
  231. }
  232. xmlNodePtr get_node_recurisve_ex(xmlNodePtr node, char *name, char *ns)
  233. {
  234. while (node != NULL) {
  235. if (node_is_equal_ex(node, name, ns)) {
  236. return node;
  237. } else if (node->children != NULL) {
  238. xmlNodePtr tmp = get_node_recurisve_ex(node->children, name, ns);
  239. if (tmp) {
  240. return tmp;
  241. }
  242. }
  243. node = node->next;
  244. }
  245. return NULL;
  246. }
  247. xmlNodePtr get_node_with_attribute_ex(xmlNodePtr node, char *name, char *name_ns, char *attribute, char *value, char *attr_ns)
  248. {
  249. xmlAttrPtr attr;
  250. while (node != NULL) {
  251. if (name != NULL) {
  252. node = get_node_ex(node, name, name_ns);
  253. if (node==NULL) {
  254. return NULL;
  255. }
  256. }
  257. attr = get_attribute_ex(node->properties, attribute, attr_ns);
  258. if (attr != NULL && strcmp((char*)attr->children->content, value) == 0) {
  259. return node;
  260. }
  261. node = node->next;
  262. }
  263. return NULL;
  264. }
  265. xmlNodePtr get_node_with_attribute_recursive_ex(xmlNodePtr node, char *name, char *name_ns, char *attribute, char *value, char *attr_ns)
  266. {
  267. while (node != NULL) {
  268. if (node_is_equal_ex(node, name, name_ns)) {
  269. xmlAttrPtr attr = get_attribute_ex(node->properties, attribute, attr_ns);
  270. if (attr != NULL && strcmp((char*)attr->children->content, value) == 0) {
  271. return node;
  272. }
  273. }
  274. if (node->children != NULL) {
  275. xmlNodePtr tmp = get_node_with_attribute_recursive_ex(node->children, name, name_ns, attribute, value, attr_ns);
  276. if (tmp) {
  277. return tmp;
  278. }
  279. }
  280. node = node->next;
  281. }
  282. return NULL;
  283. }
  284. int parse_namespace(const xmlChar *inval, char **value, char **namespace)
  285. {
  286. char *found = strrchr((char*)inval, ':');
  287. if (found != NULL && found != (char*)inval) {
  288. (*namespace) = estrndup((char*)inval, found - (char*)inval);
  289. (*value) = estrdup(++found);
  290. } else {
  291. (*value) = estrdup((char*)inval);
  292. (*namespace) = NULL;
  293. }
  294. return FALSE;
  295. }