123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574 |
- /*
- +----------------------------------------------------------------------+
- | PHP Version 5 |
- +----------------------------------------------------------------------+
- | Copyright (c) 1997-2016 The PHP Group |
- +----------------------------------------------------------------------+
- | This source file is subject to version 3.01 of the PHP license, |
- | that is bundled with this package in the file LICENSE, and is |
- | available through the world-wide-web at the following url: |
- | http://www.php.net/license/3_01.txt |
- | If you did not receive a copy of the PHP license and are unable to |
- | obtain it through the world-wide-web, please send a note to |
- | license@php.net so we can mail you a copy immediately. |
- +----------------------------------------------------------------------+
- | Author: Sascha Schumann <sascha@schumann.cx> |
- +----------------------------------------------------------------------+
- */
- /* $Id$ */
- #include "php.h"
- #ifdef HAVE_UNISTD_H
- #include <unistd.h>
- #endif
- #ifdef HAVE_LIMITS_H
- #include <limits.h>
- #endif
- #include <stdio.h>
- #include <stdlib.h>
- #include <string.h>
- #include "php_ini.h"
- #include "php_globals.h"
- #define STATE_TAG SOME_OTHER_STATE_TAG
- #include "basic_functions.h"
- #include "url.h"
- #undef STATE_TAG
- #define url_scanner url_scanner_ex
- #include "php_smart_str.h"
- static PHP_INI_MH(OnUpdateTags)
- {
- url_adapt_state_ex_t *ctx;
- char *key;
- char *lasts;
- char *tmp;
-
- ctx = &BG(url_adapt_state_ex);
-
- tmp = estrndup(new_value, new_value_length);
-
- if (ctx->tags)
- zend_hash_destroy(ctx->tags);
- else {
- ctx->tags = malloc(sizeof(HashTable));
- if (!ctx->tags) {
- return FAILURE;
- }
- }
- zend_hash_init(ctx->tags, 0, NULL, NULL, 1);
-
- for (key = php_strtok_r(tmp, ",", &lasts);
- key;
- key = php_strtok_r(NULL, ",", &lasts)) {
- char *val;
- val = strchr(key, '=');
- if (val) {
- char *q;
- int keylen;
-
- *val++ = '\0';
- for (q = key; *q; q++)
- *q = tolower(*q);
- keylen = q - key;
- /* key is stored withOUT NUL
- val is stored WITH NUL */
- zend_hash_add(ctx->tags, key, keylen, val, strlen(val)+1, NULL);
- }
- }
- efree(tmp);
- return SUCCESS;
- }
- PHP_INI_BEGIN()
- STD_PHP_INI_ENTRY("url_rewriter.tags", "a=href,area=href,frame=src,form=,fieldset=", PHP_INI_ALL, OnUpdateTags, url_adapt_state_ex, php_basic_globals, basic_globals)
- PHP_INI_END()
- /*!re2c
- any = [\000-\377];
- N = (any\[<]);
- alpha = [a-zA-Z];
- alphanamespace = [a-zA-Z:];
- alphadash = ([a-zA-Z] | "-");
- */
- #define YYFILL(n) goto done
- #define YYCTYPE unsigned char
- #define YYCURSOR p
- #define YYLIMIT q
- #define YYMARKER r
-
- static inline void append_modified_url(smart_str *url, smart_str *dest, smart_str *url_app, const char *separator TSRMLS_DC)
- {
- register const char *p, *q;
- const char *bash = NULL;
- const char *sep = "?";
- /*
- * Don't modify "//example.com" full path, unless
- * HTTP_HOST matches.
- */
- if (url->c[0] == '/' && url->c[1] == '/') {
- zval **tmp, **http_host;
- size_t target_len, host_len;
- if (zend_hash_find(&EG(symbol_table), "_SERVER", sizeof("_SERVER"), (void **)&tmp) == FAILURE
- || Z_TYPE_PP(tmp) != IS_ARRAY
- || zend_hash_find(Z_ARRVAL_PP(tmp), "HTTP_HOST", sizeof("HTTP_HOST"), (void **)&http_host) == FAILURE
- || Z_TYPE_PP(http_host) != IS_STRING) {
- smart_str_append(dest, url);
- return;
- }
- /* HTTP_HOST could be "example.com:8888", etc. */
- /* Need to find end of URL in buffer */
- host_len = strcspn(Z_STRVAL_PP(http_host), ":");
- target_len = strcspn(url->c+2, "/\"'?>\r\n");
- if (host_len
- && host_len == target_len
- && strncasecmp(Z_STRVAL_PP(http_host), url->c+2, host_len)) {
- smart_str_append(dest, url);
- return;
- }
- }
- q = (p = url->c) + url->len;
- scan:
- /*!re2c
- ":" { smart_str_append(dest, url); return; }
- "?" { sep = separator; goto scan; }
- "#" { bash = p - 1; goto done; }
- (any\[:?#])+ { goto scan; }
- */
- done:
-
- /* Don't modify URLs of the format "#mark" */
- if (bash && bash - url->c == 0) {
- smart_str_append(dest, url);
- return;
- }
- if (bash)
- smart_str_appendl(dest, url->c, bash - url->c);
- else
- smart_str_append(dest, url);
- smart_str_appends(dest, sep);
- smart_str_append(dest, url_app);
- if (bash)
- smart_str_appendl(dest, bash, q - bash);
- }
- #undef YYFILL
- #undef YYCTYPE
- #undef YYCURSOR
- #undef YYLIMIT
- #undef YYMARKER
- static inline void tag_arg(url_adapt_state_ex_t *ctx, char quotes, char type TSRMLS_DC)
- {
- char f = 0;
- if (strncasecmp(ctx->arg.c, ctx->lookup_data, ctx->arg.len) == 0)
- f = 1;
- if (quotes)
- smart_str_appendc(&ctx->result, type);
- if (f) {
- append_modified_url(&ctx->val, &ctx->result, &ctx->url_app, PG(arg_separator).output TSRMLS_CC);
- } else {
- smart_str_append(&ctx->result, &ctx->val);
- }
- if (quotes)
- smart_str_appendc(&ctx->result, type);
- }
- enum {
- STATE_PLAIN = 0,
- STATE_TAG,
- STATE_NEXT_ARG,
- STATE_ARG,
- STATE_BEFORE_VAL,
- STATE_VAL
- };
- #define YYFILL(n) goto stop
- #define YYCTYPE unsigned char
- #define YYCURSOR xp
- #define YYLIMIT end
- #define YYMARKER q
- #define STATE ctx->state
- #define STD_PARA url_adapt_state_ex_t *ctx, char *start, char *YYCURSOR TSRMLS_DC
- #define STD_ARGS ctx, start, xp TSRMLS_CC
- #if SCANNER_DEBUG
- #define scdebug(x) printf x
- #else
- #define scdebug(x)
- #endif
- static inline void passthru(STD_PARA)
- {
- scdebug(("appending %d chars, starting with %c\n", YYCURSOR-start, *start));
- smart_str_appendl(&ctx->result, start, YYCURSOR - start);
- }
- /*
- * This function appends a hidden input field after a <form> or
- * <fieldset>. The latter is important for XHTML.
- */
- static void handle_form(STD_PARA)
- {
- int doit = 0;
- if (ctx->form_app.len > 0) {
- switch (ctx->tag.len) {
- case sizeof("form") - 1:
- if (!strncasecmp(ctx->tag.c, "form", sizeof("form") - 1)) {
- doit = 1;
- }
- if (doit && ctx->val.c && ctx->lookup_data && *ctx->lookup_data) {
- char *e, *p = zend_memnstr(ctx->val.c, "://", sizeof("://") - 1, ctx->val.c + ctx->val.len);
- if (p) {
- e = memchr(p, '/', (ctx->val.c + ctx->val.len) - p);
- if (!e) {
- e = ctx->val.c + ctx->val.len;
- }
- if ((e - p) && strncasecmp(p, ctx->lookup_data, (e - p))) {
- doit = 0;
- }
- }
- }
- break;
- case sizeof("fieldset") - 1:
- if (!strncasecmp(ctx->tag.c, "fieldset", sizeof("fieldset") - 1)) {
- doit = 1;
- }
- break;
- }
- if (doit)
- smart_str_append(&ctx->result, &ctx->form_app);
- }
- }
- /*
- * HANDLE_TAG copies the HTML Tag and checks whether we
- * have that tag in our table. If we might modify it,
- * we continue to scan the tag, otherwise we simply copy the complete
- * HTML stuff to the result buffer.
- */
- static inline void handle_tag(STD_PARA)
- {
- int ok = 0;
- unsigned int i;
- ctx->tag.len = 0;
- smart_str_appendl(&ctx->tag, start, YYCURSOR - start);
- for (i = 0; i < ctx->tag.len; i++)
- ctx->tag.c[i] = tolower((int)(unsigned char)ctx->tag.c[i]);
- if (zend_hash_find(ctx->tags, ctx->tag.c, ctx->tag.len, (void **) &ctx->lookup_data) == SUCCESS)
- ok = 1;
- STATE = ok ? STATE_NEXT_ARG : STATE_PLAIN;
- }
- static inline void handle_arg(STD_PARA)
- {
- ctx->arg.len = 0;
- smart_str_appendl(&ctx->arg, start, YYCURSOR - start);
- }
- static inline void handle_val(STD_PARA, char quotes, char type)
- {
- smart_str_setl(&ctx->val, start + quotes, YYCURSOR - start - quotes * 2);
- tag_arg(ctx, quotes, type TSRMLS_CC);
- }
- static inline void xx_mainloop(url_adapt_state_ex_t *ctx, const char *newdata, size_t newlen TSRMLS_DC)
- {
- char *end, *q;
- char *xp;
- char *start;
- int rest;
- smart_str_appendl(&ctx->buf, newdata, newlen);
-
- YYCURSOR = ctx->buf.c;
- YYLIMIT = ctx->buf.c + ctx->buf.len;
- switch (STATE) {
- case STATE_PLAIN: goto state_plain;
- case STATE_TAG: goto state_tag;
- case STATE_NEXT_ARG: goto state_next_arg;
- case STATE_ARG: goto state_arg;
- case STATE_BEFORE_VAL: goto state_before_val;
- case STATE_VAL: goto state_val;
- }
-
- state_plain_begin:
- STATE = STATE_PLAIN;
-
- state_plain:
- start = YYCURSOR;
- /*!re2c
- "<" { passthru(STD_ARGS); STATE = STATE_TAG; goto state_tag; }
- N+ { passthru(STD_ARGS); goto state_plain; }
- */
- state_tag:
- start = YYCURSOR;
- /*!re2c
- alphanamespace+ { handle_tag(STD_ARGS); /* Sets STATE */; passthru(STD_ARGS); if (STATE == STATE_PLAIN) goto state_plain; else goto state_next_arg; }
- any { passthru(STD_ARGS); goto state_plain_begin; }
- */
- state_next_arg_begin:
- STATE = STATE_NEXT_ARG;
-
- state_next_arg:
- start = YYCURSOR;
- /*!re2c
- [/]? [>] { passthru(STD_ARGS); handle_form(STD_ARGS); goto state_plain_begin; }
- [ \v\r\t\n]+ { passthru(STD_ARGS); goto state_next_arg; }
- alpha { --YYCURSOR; STATE = STATE_ARG; goto state_arg; }
- any { passthru(STD_ARGS); goto state_plain_begin; }
- */
- state_arg:
- start = YYCURSOR;
- /*!re2c
- alpha alphadash* { passthru(STD_ARGS); handle_arg(STD_ARGS); STATE = STATE_BEFORE_VAL; goto state_before_val; }
- any { passthru(STD_ARGS); STATE = STATE_NEXT_ARG; goto state_next_arg; }
- */
- state_before_val:
- start = YYCURSOR;
- /*!re2c
- [ ]* "=" [ ]* { passthru(STD_ARGS); STATE = STATE_VAL; goto state_val; }
- any { --YYCURSOR; goto state_next_arg_begin; }
- */
- state_val:
- start = YYCURSOR;
- /*!re2c
- ["] (any\[">])* ["] { handle_val(STD_ARGS, 1, '"'); goto state_next_arg_begin; }
- ['] (any\['>])* ['] { handle_val(STD_ARGS, 1, '\''); goto state_next_arg_begin; }
- (any\[ \r\t\n>'"])+ { handle_val(STD_ARGS, 0, ' '); goto state_next_arg_begin; }
- any { passthru(STD_ARGS); goto state_next_arg_begin; }
- */
- stop:
- rest = YYLIMIT - start;
- scdebug(("stopped in state %d at pos %d (%d:%c) %d\n", STATE, YYCURSOR - ctx->buf.c, *YYCURSOR, *YYCURSOR, rest));
- /* XXX: Crash avoidance. Need to work with reporter to figure out what goes wrong */
- if (rest < 0) rest = 0;
-
- if (rest) memmove(ctx->buf.c, start, rest);
- ctx->buf.len = rest;
- }
- char *php_url_scanner_adapt_single_url(const char *url, size_t urllen, const char *name, const char *value, size_t *newlen TSRMLS_DC)
- {
- smart_str surl = {0};
- smart_str buf = {0};
- smart_str url_app = {0};
- smart_str_setl(&surl, url, urllen);
- smart_str_appends(&url_app, name);
- smart_str_appendc(&url_app, '=');
- smart_str_appends(&url_app, value);
- append_modified_url(&surl, &buf, &url_app, PG(arg_separator).output TSRMLS_CC);
- smart_str_0(&buf);
- if (newlen) *newlen = buf.len;
- smart_str_free(&url_app);
- return buf.c;
- }
- static char *url_adapt_ext(const char *src, size_t srclen, size_t *newlen, zend_bool do_flush TSRMLS_DC)
- {
- url_adapt_state_ex_t *ctx;
- char *retval;
- ctx = &BG(url_adapt_state_ex);
- xx_mainloop(ctx, src, srclen TSRMLS_CC);
- *newlen = ctx->result.len;
- if (!ctx->result.c) {
- smart_str_appendl(&ctx->result, "", 0);
- }
- smart_str_0(&ctx->result);
- if (do_flush) {
- smart_str_appendl(&ctx->result, ctx->buf.c, ctx->buf.len);
- *newlen += ctx->buf.len;
- smart_str_free(&ctx->buf);
- }
- retval = ctx->result.c;
- ctx->result.c = NULL;
- ctx->result.len = 0;
- return retval;
- }
- static int php_url_scanner_ex_activate(TSRMLS_D)
- {
- url_adapt_state_ex_t *ctx;
-
- ctx = &BG(url_adapt_state_ex);
- memset(ctx, 0, ((size_t) &((url_adapt_state_ex_t *)0)->tags));
- return SUCCESS;
- }
- static int php_url_scanner_ex_deactivate(TSRMLS_D)
- {
- url_adapt_state_ex_t *ctx;
-
- ctx = &BG(url_adapt_state_ex);
- smart_str_free(&ctx->result);
- smart_str_free(&ctx->buf);
- smart_str_free(&ctx->tag);
- smart_str_free(&ctx->arg);
- return SUCCESS;
- }
- static void php_url_scanner_output_handler(char *output, uint output_len, char **handled_output, uint *handled_output_len, int mode TSRMLS_DC)
- {
- size_t len;
- if (BG(url_adapt_state_ex).url_app.len != 0) {
- *handled_output = url_adapt_ext(output, output_len, &len, (zend_bool) (mode & (PHP_OUTPUT_HANDLER_END | PHP_OUTPUT_HANDLER_CONT | PHP_OUTPUT_HANDLER_FLUSH | PHP_OUTPUT_HANDLER_FINAL) ? 1 : 0) TSRMLS_CC);
- if (sizeof(uint) < sizeof(size_t)) {
- if (len > UINT_MAX)
- len = UINT_MAX;
- }
- *handled_output_len = len;
- } else if (BG(url_adapt_state_ex).url_app.len == 0) {
- url_adapt_state_ex_t *ctx = &BG(url_adapt_state_ex);
- if (ctx->buf.len) {
- smart_str_appendl(&ctx->result, ctx->buf.c, ctx->buf.len);
- smart_str_appendl(&ctx->result, output, output_len);
- *handled_output = ctx->result.c;
- *handled_output_len = ctx->buf.len + output_len;
- ctx->result.c = NULL;
- ctx->result.len = 0;
- smart_str_free(&ctx->buf);
- } else {
- *handled_output = estrndup(output, *handled_output_len = output_len);
- }
- } else {
- *handled_output = NULL;
- }
- }
- PHPAPI int php_url_scanner_add_var(char *name, int name_len, char *value, int value_len, int urlencode TSRMLS_DC)
- {
- char *encoded = NULL;
- int encoded_len;
- smart_str val;
-
- if (! BG(url_adapt_state_ex).active) {
- php_url_scanner_ex_activate(TSRMLS_C);
- php_output_start_internal(ZEND_STRL("URL-Rewriter"), php_url_scanner_output_handler, 0, PHP_OUTPUT_HANDLER_STDFLAGS TSRMLS_CC);
- BG(url_adapt_state_ex).active = 1;
- }
- if (BG(url_adapt_state_ex).url_app.len != 0) {
- smart_str_appends(&BG(url_adapt_state_ex).url_app, PG(arg_separator).output);
- }
- if (urlencode) {
- encoded = php_url_encode(value, value_len, &encoded_len);
- smart_str_setl(&val, encoded, encoded_len);
- } else {
- smart_str_setl(&val, value, value_len);
- }
-
- smart_str_appendl(&BG(url_adapt_state_ex).url_app, name, name_len);
- smart_str_appendc(&BG(url_adapt_state_ex).url_app, '=');
- smart_str_append(&BG(url_adapt_state_ex).url_app, &val);
- smart_str_appends(&BG(url_adapt_state_ex).form_app, "<input type=\"hidden\" name=\"");
- smart_str_appendl(&BG(url_adapt_state_ex).form_app, name, name_len);
- smart_str_appends(&BG(url_adapt_state_ex).form_app, "\" value=\"");
- smart_str_append(&BG(url_adapt_state_ex).form_app, &val);
- smart_str_appends(&BG(url_adapt_state_ex).form_app, "\" />");
- if (urlencode)
- efree(encoded);
- return SUCCESS;
- }
- PHPAPI int php_url_scanner_reset_vars(TSRMLS_D)
- {
- BG(url_adapt_state_ex).form_app.len = 0;
- BG(url_adapt_state_ex).url_app.len = 0;
- return SUCCESS;
- }
- PHP_MINIT_FUNCTION(url_scanner)
- {
- BG(url_adapt_state_ex).tags = NULL;
- BG(url_adapt_state_ex).form_app.c = BG(url_adapt_state_ex).url_app.c = 0;
- BG(url_adapt_state_ex).form_app.len = BG(url_adapt_state_ex).url_app.len = 0;
- REGISTER_INI_ENTRIES();
- return SUCCESS;
- }
- PHP_MSHUTDOWN_FUNCTION(url_scanner)
- {
- UNREGISTER_INI_ENTRIES();
- return SUCCESS;
- }
- PHP_RINIT_FUNCTION(url_scanner)
- {
- BG(url_adapt_state_ex).active = 0;
-
- return SUCCESS;
- }
- PHP_RSHUTDOWN_FUNCTION(url_scanner)
- {
- if (BG(url_adapt_state_ex).active) {
- php_url_scanner_ex_deactivate(TSRMLS_C);
- BG(url_adapt_state_ex).active = 0;
- }
- smart_str_free(&BG(url_adapt_state_ex).form_app);
- smart_str_free(&BG(url_adapt_state_ex).url_app);
- return SUCCESS;
- }
|