pdo_sql_parser.re 14 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523
  1. /*
  2. +----------------------------------------------------------------------+
  3. | PHP Version 5 |
  4. +----------------------------------------------------------------------+
  5. | Copyright (c) 1997-2016 The PHP Group |
  6. +----------------------------------------------------------------------+
  7. | This source file is subject to version 3.01 of the PHP license, |
  8. | that is bundled with this package in the file LICENSE, and is |
  9. | available through the world-wide-web at the following url: |
  10. | http://www.php.net/license/3_01.txt |
  11. | If you did not receive a copy of the PHP license and are unable to |
  12. | obtain it through the world-wide-web, please send a note to |
  13. | license@php.net so we can mail you a copy immediately. |
  14. +----------------------------------------------------------------------+
  15. | Author: George Schlossnagle <george@omniti.com> |
  16. +----------------------------------------------------------------------+
  17. */
  18. /* $Id$ */
  19. #include "php.h"
  20. #include "php_pdo_driver.h"
  21. #include "php_pdo_int.h"
  22. #define PDO_PARSER_TEXT 1
  23. #define PDO_PARSER_BIND 2
  24. #define PDO_PARSER_BIND_POS 3
  25. #define PDO_PARSER_EOI 4
  26. #define RET(i) {s->cur = cursor; return i; }
  27. #define SKIP_ONE(i) {s->cur = s->tok + 1; return i; }
  28. #define YYCTYPE unsigned char
  29. #define YYCURSOR cursor
  30. #define YYLIMIT s->end
  31. #define YYMARKER s->ptr
  32. #define YYFILL(n) { RET(PDO_PARSER_EOI); }
  33. typedef struct Scanner {
  34. char *ptr, *cur, *tok, *end;
  35. } Scanner;
  36. static int scan(Scanner *s)
  37. {
  38. char *cursor = s->cur;
  39. s->tok = cursor;
  40. /*!re2c
  41. BINDCHR = [:][a-zA-Z0-9_]+;
  42. QUESTION = [?];
  43. COMMENTS = ("/*"([^*]+|[*]+[^/*])*[*]*"*/"|"--"[^\r\n]*);
  44. SPECIALS = [:?"'-/];
  45. MULTICHAR = ([:]{2,}|[?]{2,});
  46. ANYNOEOF = [\001-\377];
  47. */
  48. /*!re2c
  49. (["](([\\]ANYNOEOF)|ANYNOEOF\["\\])*["]) { RET(PDO_PARSER_TEXT); }
  50. (['](([\\]ANYNOEOF)|ANYNOEOF\['\\])*[']) { RET(PDO_PARSER_TEXT); }
  51. MULTICHAR { RET(PDO_PARSER_TEXT); }
  52. BINDCHR { RET(PDO_PARSER_BIND); }
  53. QUESTION { RET(PDO_PARSER_BIND_POS); }
  54. SPECIALS { SKIP_ONE(PDO_PARSER_TEXT); }
  55. COMMENTS { RET(PDO_PARSER_TEXT); }
  56. (ANYNOEOF\SPECIALS)+ { RET(PDO_PARSER_TEXT); }
  57. */
  58. }
  59. struct placeholder {
  60. char *pos;
  61. int len;
  62. int bindno;
  63. int qlen; /* quoted length of value */
  64. char *quoted; /* quoted value */
  65. int freeq;
  66. struct placeholder *next;
  67. };
  68. PDO_API int pdo_parse_params(pdo_stmt_t *stmt, char *inquery, int inquery_len,
  69. char **outquery, int *outquery_len TSRMLS_DC)
  70. {
  71. Scanner s;
  72. char *ptr, *newbuffer;
  73. int t;
  74. int bindno = 0;
  75. int ret = 0;
  76. int newbuffer_len;
  77. HashTable *params;
  78. struct pdo_bound_param_data *param;
  79. int query_type = PDO_PLACEHOLDER_NONE;
  80. struct placeholder *placeholders = NULL, *placetail = NULL, *plc = NULL;
  81. ptr = *outquery;
  82. s.cur = inquery;
  83. s.end = inquery + inquery_len + 1;
  84. /* phase 1: look for args */
  85. while((t = scan(&s)) != PDO_PARSER_EOI) {
  86. if (t == PDO_PARSER_BIND || t == PDO_PARSER_BIND_POS) {
  87. if (t == PDO_PARSER_BIND) {
  88. int len = s.cur - s.tok;
  89. if ((inquery < (s.cur - len)) && isalnum(*(s.cur - len - 1))) {
  90. continue;
  91. }
  92. query_type |= PDO_PLACEHOLDER_NAMED;
  93. } else {
  94. query_type |= PDO_PLACEHOLDER_POSITIONAL;
  95. }
  96. plc = emalloc(sizeof(*plc));
  97. memset(plc, 0, sizeof(*plc));
  98. plc->next = NULL;
  99. plc->pos = s.tok;
  100. plc->len = s.cur - s.tok;
  101. plc->bindno = bindno++;
  102. if (placetail) {
  103. placetail->next = plc;
  104. } else {
  105. placeholders = plc;
  106. }
  107. placetail = plc;
  108. }
  109. }
  110. if (bindno == 0) {
  111. /* nothing to do; good! */
  112. return 0;
  113. }
  114. /* did the query make sense to me? */
  115. if (query_type == (PDO_PLACEHOLDER_NAMED|PDO_PLACEHOLDER_POSITIONAL)) {
  116. /* they mixed both types; punt */
  117. pdo_raise_impl_error(stmt->dbh, stmt, "HY093", "mixed named and positional parameters" TSRMLS_CC);
  118. ret = -1;
  119. goto clean_up;
  120. }
  121. if (stmt->supports_placeholders == query_type && !stmt->named_rewrite_template) {
  122. /* query matches native syntax */
  123. ret = 0;
  124. goto clean_up;
  125. }
  126. if (stmt->named_rewrite_template) {
  127. /* magic/hack.
  128. * We we pretend that the query was positional even if
  129. * it was named so that we fall into the
  130. * named rewrite case below. Not too pretty,
  131. * but it works. */
  132. query_type = PDO_PLACEHOLDER_POSITIONAL;
  133. }
  134. params = stmt->bound_params;
  135. /* Do we have placeholders but no bound params */
  136. if (bindno && !params && stmt->supports_placeholders == PDO_PLACEHOLDER_NONE) {
  137. pdo_raise_impl_error(stmt->dbh, stmt, "HY093", "no parameters were bound" TSRMLS_CC);
  138. ret = -1;
  139. goto clean_up;
  140. }
  141. if (params && bindno != zend_hash_num_elements(params) && stmt->supports_placeholders == PDO_PLACEHOLDER_NONE) {
  142. /* extra bit of validation for instances when same params are bound more then once */
  143. if (query_type != PDO_PLACEHOLDER_POSITIONAL && bindno > zend_hash_num_elements(params)) {
  144. int ok = 1;
  145. for (plc = placeholders; plc; plc = plc->next) {
  146. if (zend_hash_find(params, plc->pos, plc->len, (void**) &param) == FAILURE) {
  147. ok = 0;
  148. break;
  149. }
  150. }
  151. if (ok) {
  152. goto safe;
  153. }
  154. }
  155. pdo_raise_impl_error(stmt->dbh, stmt, "HY093", "number of bound variables does not match number of tokens" TSRMLS_CC);
  156. ret = -1;
  157. goto clean_up;
  158. }
  159. safe:
  160. /* what are we going to do ? */
  161. if (stmt->supports_placeholders == PDO_PLACEHOLDER_NONE) {
  162. /* query generation */
  163. newbuffer_len = inquery_len;
  164. /* let's quote all the values */
  165. for (plc = placeholders; plc; plc = plc->next) {
  166. if (query_type == PDO_PLACEHOLDER_POSITIONAL) {
  167. ret = zend_hash_index_find(params, plc->bindno, (void**) &param);
  168. } else {
  169. ret = zend_hash_find(params, plc->pos, plc->len, (void**) &param);
  170. }
  171. if (ret == FAILURE) {
  172. /* parameter was not defined */
  173. ret = -1;
  174. pdo_raise_impl_error(stmt->dbh, stmt, "HY093", "parameter was not defined" TSRMLS_CC);
  175. goto clean_up;
  176. }
  177. if (stmt->dbh->methods->quoter) {
  178. if (param->param_type == PDO_PARAM_LOB && Z_TYPE_P(param->parameter) == IS_RESOURCE) {
  179. php_stream *stm;
  180. php_stream_from_zval_no_verify(stm, &param->parameter);
  181. if (stm) {
  182. size_t len;
  183. char *buf = NULL;
  184. len = php_stream_copy_to_mem(stm, &buf, PHP_STREAM_COPY_ALL, 0);
  185. if (!stmt->dbh->methods->quoter(stmt->dbh, buf, len, &plc->quoted, &plc->qlen,
  186. param->param_type TSRMLS_CC)) {
  187. /* bork */
  188. ret = -1;
  189. strncpy(stmt->error_code, stmt->dbh->error_code, 6);
  190. if (buf) {
  191. efree(buf);
  192. }
  193. goto clean_up;
  194. }
  195. if (buf) {
  196. efree(buf);
  197. }
  198. } else {
  199. pdo_raise_impl_error(stmt->dbh, stmt, "HY105", "Expected a stream resource" TSRMLS_CC);
  200. ret = -1;
  201. goto clean_up;
  202. }
  203. plc->freeq = 1;
  204. } else {
  205. zval tmp_param = *param->parameter;
  206. zval_copy_ctor(&tmp_param);
  207. switch (Z_TYPE(tmp_param)) {
  208. case IS_NULL:
  209. plc->quoted = "NULL";
  210. plc->qlen = sizeof("NULL")-1;
  211. plc->freeq = 0;
  212. break;
  213. case IS_BOOL:
  214. convert_to_long(&tmp_param);
  215. /* fall through */
  216. case IS_LONG:
  217. case IS_DOUBLE:
  218. convert_to_string(&tmp_param);
  219. plc->qlen = Z_STRLEN(tmp_param);
  220. plc->quoted = estrdup(Z_STRVAL(tmp_param));
  221. plc->freeq = 1;
  222. break;
  223. default:
  224. convert_to_string(&tmp_param);
  225. if (!stmt->dbh->methods->quoter(stmt->dbh, Z_STRVAL(tmp_param),
  226. Z_STRLEN(tmp_param), &plc->quoted, &plc->qlen,
  227. param->param_type TSRMLS_CC)) {
  228. /* bork */
  229. ret = -1;
  230. strncpy(stmt->error_code, stmt->dbh->error_code, 6);
  231. goto clean_up;
  232. }
  233. plc->freeq = 1;
  234. }
  235. zval_dtor(&tmp_param);
  236. }
  237. } else {
  238. plc->quoted = Z_STRVAL_P(param->parameter);
  239. plc->qlen = Z_STRLEN_P(param->parameter);
  240. }
  241. newbuffer_len += plc->qlen;
  242. }
  243. rewrite:
  244. /* allocate output buffer */
  245. newbuffer = emalloc(newbuffer_len + 1);
  246. *outquery = newbuffer;
  247. /* and build the query */
  248. plc = placeholders;
  249. ptr = inquery;
  250. do {
  251. t = plc->pos - ptr;
  252. if (t) {
  253. memcpy(newbuffer, ptr, t);
  254. newbuffer += t;
  255. }
  256. memcpy(newbuffer, plc->quoted, plc->qlen);
  257. newbuffer += plc->qlen;
  258. ptr = plc->pos + plc->len;
  259. plc = plc->next;
  260. } while (plc);
  261. t = (inquery + inquery_len) - ptr;
  262. if (t) {
  263. memcpy(newbuffer, ptr, t);
  264. newbuffer += t;
  265. }
  266. *newbuffer = '\0';
  267. *outquery_len = newbuffer - *outquery;
  268. ret = 1;
  269. goto clean_up;
  270. } else if (query_type == PDO_PLACEHOLDER_POSITIONAL) {
  271. /* rewrite ? to :pdoX */
  272. char *name, *idxbuf;
  273. const char *tmpl = stmt->named_rewrite_template ? stmt->named_rewrite_template : ":pdo%d";
  274. int bind_no = 1;
  275. newbuffer_len = inquery_len;
  276. if (stmt->bound_param_map == NULL) {
  277. ALLOC_HASHTABLE(stmt->bound_param_map);
  278. zend_hash_init(stmt->bound_param_map, 13, NULL, NULL, 0);
  279. }
  280. for (plc = placeholders; plc; plc = plc->next) {
  281. int skip_map = 0;
  282. char *p;
  283. name = estrndup(plc->pos, plc->len);
  284. /* check if bound parameter is already available */
  285. if (!strcmp(name, "?") || zend_hash_find(stmt->bound_param_map, name, plc->len + 1, (void**) &p) == FAILURE) {
  286. spprintf(&idxbuf, 0, tmpl, bind_no++);
  287. } else {
  288. idxbuf = estrdup(p);
  289. skip_map = 1;
  290. }
  291. plc->quoted = idxbuf;
  292. plc->qlen = strlen(plc->quoted);
  293. plc->freeq = 1;
  294. newbuffer_len += plc->qlen;
  295. if (!skip_map && stmt->named_rewrite_template) {
  296. /* create a mapping */
  297. zend_hash_update(stmt->bound_param_map, name, plc->len + 1, idxbuf, plc->qlen + 1, NULL);
  298. }
  299. /* map number to name */
  300. zend_hash_index_update(stmt->bound_param_map, plc->bindno, idxbuf, plc->qlen + 1, NULL);
  301. efree(name);
  302. }
  303. goto rewrite;
  304. } else {
  305. /* rewrite :name to ? */
  306. newbuffer_len = inquery_len;
  307. if (stmt->bound_param_map == NULL) {
  308. ALLOC_HASHTABLE(stmt->bound_param_map);
  309. zend_hash_init(stmt->bound_param_map, 13, NULL, NULL, 0);
  310. }
  311. for (plc = placeholders; plc; plc = plc->next) {
  312. char *name;
  313. name = estrndup(plc->pos, plc->len);
  314. zend_hash_index_update(stmt->bound_param_map, plc->bindno, name, plc->len + 1, NULL);
  315. efree(name);
  316. plc->quoted = "?";
  317. plc->qlen = 1;
  318. }
  319. goto rewrite;
  320. }
  321. clean_up:
  322. while (placeholders) {
  323. plc = placeholders;
  324. placeholders = plc->next;
  325. if (plc->freeq) {
  326. efree(plc->quoted);
  327. }
  328. efree(plc);
  329. }
  330. return ret;
  331. }
  332. #if 0
  333. int old_pdo_parse_params(pdo_stmt_t *stmt, char *inquery, int inquery_len, char **outquery,
  334. int *outquery_len TSRMLS_DC)
  335. {
  336. Scanner s;
  337. char *ptr;
  338. int t;
  339. int bindno = 0;
  340. int newbuffer_len;
  341. int padding;
  342. HashTable *params = stmt->bound_params;
  343. struct pdo_bound_param_data *param;
  344. /* allocate buffer for query with expanded binds, ptr is our writing pointer */
  345. newbuffer_len = inquery_len;
  346. /* calculate the possible padding factor due to quoting */
  347. if(stmt->dbh->max_escaped_char_length) {
  348. padding = stmt->dbh->max_escaped_char_length;
  349. } else {
  350. padding = 3;
  351. }
  352. if(params) {
  353. zend_hash_internal_pointer_reset(params);
  354. while (SUCCESS == zend_hash_get_current_data(params, (void**)&param)) {
  355. if(param->parameter) {
  356. convert_to_string(param->parameter);
  357. /* accommodate a string that needs to be fully quoted
  358. bind placeholders are at least 2 characters, so
  359. the accommodate their own "'s
  360. */
  361. newbuffer_len += padding * Z_STRLEN_P(param->parameter);
  362. }
  363. zend_hash_move_forward(params);
  364. }
  365. }
  366. *outquery = (char *) emalloc(newbuffer_len + 1);
  367. *outquery_len = 0;
  368. ptr = *outquery;
  369. s.cur = inquery;
  370. while((t = scan(&s)) != PDO_PARSER_EOI) {
  371. if(t == PDO_PARSER_TEXT) {
  372. memcpy(ptr, s.tok, s.cur - s.tok);
  373. ptr += (s.cur - s.tok);
  374. *outquery_len += (s.cur - s.tok);
  375. }
  376. else if(t == PDO_PARSER_BIND) {
  377. if(!params) {
  378. /* error */
  379. efree(*outquery);
  380. *outquery = NULL;
  381. return (int) (s.cur - inquery);
  382. }
  383. /* lookup bind first via hash and then index */
  384. /* stupid keys need to be null-terminated, even though we know their length */
  385. if((SUCCESS == zend_hash_find(params, s.tok, s.cur-s.tok,(void **)&param))
  386. ||
  387. (SUCCESS == zend_hash_index_find(params, bindno, (void **)&param)))
  388. {
  389. char *quotedstr;
  390. int quotedstrlen;
  391. /* restore the in-string key, doesn't need null-termination here */
  392. /* currently everything is a string here */
  393. /* quote the bind value if necessary */
  394. if(stmt->dbh->methods->quoter(stmt->dbh, Z_STRVAL_P(param->parameter),
  395. Z_STRLEN_P(param->parameter), &quotedstr, &quotedstrlen TSRMLS_CC))
  396. {
  397. memcpy(ptr, quotedstr, quotedstrlen);
  398. ptr += quotedstrlen;
  399. *outquery_len += quotedstrlen;
  400. efree(quotedstr);
  401. } else {
  402. memcpy(ptr, Z_STRVAL_P(param->parameter), Z_STRLEN_P(param->parameter));
  403. ptr += Z_STRLEN_P(param->parameter);
  404. *outquery_len += (Z_STRLEN_P(param->parameter));
  405. }
  406. }
  407. else {
  408. /* error and cleanup */
  409. efree(*outquery);
  410. *outquery = NULL;
  411. return (int) (s.cur - inquery);
  412. }
  413. bindno++;
  414. }
  415. else if(t == PDO_PARSER_BIND_POS) {
  416. if(!params) {
  417. /* error */
  418. efree(*outquery);
  419. *outquery = NULL;
  420. return (int) (s.cur - inquery);
  421. }
  422. /* lookup bind by index */
  423. if(SUCCESS == zend_hash_index_find(params, bindno, (void **)&param))
  424. {
  425. char *quotedstr;
  426. int quotedstrlen;
  427. /* currently everything is a string here */
  428. /* quote the bind value if necessary */
  429. if(stmt->dbh->methods->quoter(stmt->dbh, Z_STRVAL_P(param->parameter),
  430. Z_STRLEN_P(param->parameter), &quotedstr, &quotedstrlen TSRMLS_CC))
  431. {
  432. memcpy(ptr, quotedstr, quotedstrlen);
  433. ptr += quotedstrlen;
  434. *outquery_len += quotedstrlen;
  435. efree(quotedstr);
  436. } else {
  437. memcpy(ptr, Z_STRVAL_P(param->parameter), Z_STRLEN_P(param->parameter));
  438. ptr += Z_STRLEN_P(param->parameter);
  439. *outquery_len += (Z_STRLEN_P(param->parameter));
  440. }
  441. }
  442. else {
  443. /* error and cleanup */
  444. efree(*outquery);
  445. *outquery = NULL;
  446. return (int) (s.cur - inquery);
  447. }
  448. bindno++;
  449. }
  450. }
  451. *ptr = '\0';
  452. return 0;
  453. }
  454. #endif
  455. /*
  456. * Local variables:
  457. * tab-width: 4
  458. * c-basic-offset: 4
  459. * End:
  460. * vim600: noet sw=4 ts=4 fdm=marker ft=c
  461. * vim<600: noet sw=4 ts=4
  462. */