mysqlnd_charset.c 38 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670671672673674675676677678679680681682683684685686687688689690691692693694695696697698699700701702703704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951
  1. /*
  2. +----------------------------------------------------------------------+
  3. | PHP Version 7 |
  4. +----------------------------------------------------------------------+
  5. | Copyright (c) 2006-2018 The PHP Group |
  6. +----------------------------------------------------------------------+
  7. | This source file is subject to version 3.01 of the PHP license, |
  8. | that is bundled with this package in the file LICENSE, and is |
  9. | available through the world-wide-web at the following url: |
  10. | http://www.php.net/license/3_01.txt |
  11. | If you did not receive a copy of the PHP license and are unable to |
  12. | obtain it through the world-wide-web, please send a note to |
  13. | license@php.net so we can mail you a copy immediately. |
  14. +----------------------------------------------------------------------+
  15. | Authors: Andrey Hristov <andrey@php.net> |
  16. | Ulf Wendel <uw@php.net> |
  17. | Georg Richter <georg@php.net> |
  18. +----------------------------------------------------------------------+
  19. */
  20. #include "php.h"
  21. #include "mysqlnd.h"
  22. #include "mysqlnd_priv.h"
  23. #include "mysqlnd_debug.h"
  24. #include "mysqlnd_charset.h"
  25. /* {{{ utf8 functions */
  26. static unsigned int check_mb_utf8mb3_sequence(const char *start, const char *end)
  27. {
  28. zend_uchar c;
  29. if (start >= end) {
  30. return 0;
  31. }
  32. c = (zend_uchar) start[0];
  33. if (c < 0x80) {
  34. return 1; /* single byte character */
  35. }
  36. if (c < 0xC2) {
  37. return 0; /* invalid mb character */
  38. }
  39. if (c < 0xE0) {
  40. if (start + 2 > end) {
  41. return 0; /* too small */
  42. }
  43. if (!(((zend_uchar)start[1] ^ 0x80) < 0x40)) {
  44. return 0;
  45. }
  46. return 2;
  47. }
  48. if (c < 0xF0) {
  49. if (start + 3 > end) {
  50. return 0; /* too small */
  51. }
  52. if (!(((zend_uchar)start[1] ^ 0x80) < 0x40 && ((zend_uchar)start[2] ^ 0x80) < 0x40 &&
  53. (c >= 0xE1 || (zend_uchar)start[1] >= 0xA0))) {
  54. return 0; /* invalid utf8 character */
  55. }
  56. return 3;
  57. }
  58. return 0;
  59. }
  60. static unsigned int check_mb_utf8_sequence(const char *start, const char *end)
  61. {
  62. zend_uchar c;
  63. if (start >= end) {
  64. return 0;
  65. }
  66. c = (zend_uchar) start[0];
  67. if (c < 0x80) {
  68. return 1; /* single byte character */
  69. }
  70. if (c < 0xC2) {
  71. return 0; /* invalid mb character */
  72. }
  73. if (c < 0xE0) {
  74. if (start + 2 > end) {
  75. return 0; /* too small */
  76. }
  77. if (!(((zend_uchar)start[1] ^ 0x80) < 0x40)) {
  78. return 0;
  79. }
  80. return 2;
  81. }
  82. if (c < 0xF0) {
  83. if (start + 3 > end) {
  84. return 0; /* too small */
  85. }
  86. if (!(((zend_uchar)start[1] ^ 0x80) < 0x40 && ((zend_uchar)start[2] ^ 0x80) < 0x40 &&
  87. (c >= 0xE1 || (zend_uchar)start[1] >= 0xA0))) {
  88. return 0; /* invalid utf8 character */
  89. }
  90. return 3;
  91. }
  92. if (c < 0xF5) {
  93. if (start + 4 > end) { /* We need 4 characters */
  94. return 0; /* too small */
  95. }
  96. /*
  97. UTF-8 quick four-byte mask:
  98. 11110xxx 10xxxxxx 10xxxxxx 10xxxxxx
  99. Encoding allows to encode U+00010000..U+001FFFFF
  100. The maximum character defined in the Unicode standard is U+0010FFFF.
  101. Higher characters U+00110000..U+001FFFFF are not used.
  102. 11110000.10010000.10xxxxxx.10xxxxxx == F0.90.80.80 == U+00010000 (min)
  103. 11110100.10001111.10111111.10111111 == F4.8F.BF.BF == U+0010FFFF (max)
  104. Valid codes:
  105. [F0][90..BF][80..BF][80..BF]
  106. [F1][80..BF][80..BF][80..BF]
  107. [F2][80..BF][80..BF][80..BF]
  108. [F3][80..BF][80..BF][80..BF]
  109. [F4][80..8F][80..BF][80..BF]
  110. */
  111. if (!(((zend_uchar)start[1] ^ 0x80) < 0x40 &&
  112. ((zend_uchar)start[2] ^ 0x80) < 0x40 &&
  113. ((zend_uchar)start[3] ^ 0x80) < 0x40 &&
  114. (c >= 0xf1 || (zend_uchar)start[1] >= 0x90) &&
  115. (c <= 0xf3 || (zend_uchar)start[1] <= 0x8F)))
  116. {
  117. return 0; /* invalid utf8 character */
  118. }
  119. return 4;
  120. }
  121. return 0;
  122. }
  123. static unsigned int check_mb_utf8mb3_valid(const char *start, const char *end)
  124. {
  125. unsigned int len = check_mb_utf8mb3_sequence(start, end);
  126. return (len > 1)? len:0;
  127. }
  128. static unsigned int check_mb_utf8_valid(const char *start, const char *end)
  129. {
  130. unsigned int len = check_mb_utf8_sequence(start, end);
  131. return (len > 1)? len:0;
  132. }
  133. static unsigned int mysqlnd_mbcharlen_utf8mb3(unsigned int utf8)
  134. {
  135. if (utf8 < 0x80) {
  136. return 1; /* single byte character */
  137. }
  138. if (utf8 < 0xC2) {
  139. return 0; /* invalid multibyte header */
  140. }
  141. if (utf8 < 0xE0) {
  142. return 2; /* double byte character */
  143. }
  144. if (utf8 < 0xF0) {
  145. return 3; /* triple byte character */
  146. }
  147. return 0;
  148. }
  149. static unsigned int mysqlnd_mbcharlen_utf8(unsigned int utf8)
  150. {
  151. if (utf8 < 0x80) {
  152. return 1; /* single byte character */
  153. }
  154. if (utf8 < 0xC2) {
  155. return 0; /* invalid multibyte header */
  156. }
  157. if (utf8 < 0xE0) {
  158. return 2; /* double byte character */
  159. }
  160. if (utf8 < 0xF0) {
  161. return 3; /* triple byte character */
  162. }
  163. if (utf8 < 0xF8) {
  164. return 4; /* four byte character */
  165. }
  166. return 0;
  167. }
  168. /* }}} */
  169. /* {{{ big5 functions */
  170. #define valid_big5head(c) (0xA1 <= (unsigned int)(c) && (unsigned int)(c) <= 0xF9)
  171. #define valid_big5tail(c) ((0x40 <= (unsigned int)(c) && (unsigned int)(c) <= 0x7E) || \
  172. (0xA1 <= (unsigned int)(c) && (unsigned int)(c) <= 0xFE))
  173. #define isbig5code(c,d) (isbig5head(c) && isbig5tail(d))
  174. static unsigned int check_mb_big5(const char *start, const char *end)
  175. {
  176. return (valid_big5head(*(start)) && (end - start) > 1 && valid_big5tail(*(start + 1)) ? 2 : 0);
  177. }
  178. static unsigned int mysqlnd_mbcharlen_big5(unsigned int big5)
  179. {
  180. return (valid_big5head(big5)) ? 2 : 1;
  181. }
  182. /* }}} */
  183. /* {{{ cp932 functions */
  184. #define valid_cp932head(c) ((0x81 <= (c) && (c) <= 0x9F) || (0xE0 <= (c) && c <= 0xFC))
  185. #define valid_cp932tail(c) ((0x40 <= (c) && (c) <= 0x7E) || (0x80 <= (c) && c <= 0xFC))
  186. static unsigned int check_mb_cp932(const char *start, const char *end)
  187. {
  188. return (valid_cp932head((zend_uchar)start[0]) && (end - start > 1) &&
  189. valid_cp932tail((zend_uchar)start[1])) ? 2 : 0;
  190. }
  191. static unsigned int mysqlnd_mbcharlen_cp932(unsigned int cp932)
  192. {
  193. return (valid_cp932head((zend_uchar)cp932)) ? 2 : 1;
  194. }
  195. /* }}} */
  196. /* {{{ euckr functions */
  197. #define valid_euckr(c) ((0xA1 <= (zend_uchar)(c) && (zend_uchar)(c) <= 0xFE))
  198. static unsigned int check_mb_euckr(const char *start, const char *end)
  199. {
  200. if (end - start <= 1) {
  201. return 0; /* invalid length */
  202. }
  203. if (*(zend_uchar *)start < 0x80) {
  204. return 0; /* invalid euckr character */
  205. }
  206. if (valid_euckr(start[1])) {
  207. return 2;
  208. }
  209. return 0;
  210. }
  211. static unsigned int mysqlnd_mbcharlen_euckr(unsigned int kr)
  212. {
  213. return (valid_euckr(kr)) ? 2 : 1;
  214. }
  215. /* }}} */
  216. /* {{{ eucjpms functions */
  217. #define valid_eucjpms(c) (((c) & 0xFF) >= 0xA1 && ((c) & 0xFF) <= 0xFE)
  218. #define valid_eucjpms_kata(c) (((c) & 0xFF) >= 0xA1 && ((c) & 0xFF) <= 0xDF)
  219. #define valid_eucjpms_ss2(c) (((c) & 0xFF) == 0x8E)
  220. #define valid_eucjpms_ss3(c) (((c) & 0xFF) == 0x8F)
  221. static unsigned int check_mb_eucjpms(const char *start, const char *end)
  222. {
  223. if (*((zend_uchar *)start) < 0x80) {
  224. return 0; /* invalid eucjpms character */
  225. }
  226. if (valid_eucjpms(start[0]) && (end - start) > 1 && valid_eucjpms(start[1])) {
  227. return 2;
  228. }
  229. if (valid_eucjpms_ss2(start[0]) && (end - start) > 1 && valid_eucjpms_kata(start[1])) {
  230. return 2;
  231. }
  232. if (valid_eucjpms_ss3(start[0]) && (end - start) > 2 && valid_eucjpms(start[1]) &&
  233. valid_eucjpms(start[2])) {
  234. return 2;
  235. }
  236. return 0;
  237. }
  238. static unsigned int mysqlnd_mbcharlen_eucjpms(unsigned int jpms)
  239. {
  240. if (valid_eucjpms(jpms) || valid_eucjpms_ss2(jpms)) {
  241. return 2;
  242. }
  243. if (valid_eucjpms_ss3(jpms)) {
  244. return 3;
  245. }
  246. return 1;
  247. }
  248. /* }}} */
  249. /* {{{ gb2312 functions */
  250. #define valid_gb2312_head(c) (0xA1 <= (zend_uchar)(c) && (zend_uchar)(c) <= 0xF7)
  251. #define valid_gb2312_tail(c) (0xA1 <= (zend_uchar)(c) && (zend_uchar)(c) <= 0xFE)
  252. static unsigned int check_mb_gb2312(const char *start, const char *end)
  253. {
  254. return (valid_gb2312_head((unsigned int)start[0]) && end - start > 1 &&
  255. valid_gb2312_tail((unsigned int)start[1])) ? 2 : 0;
  256. }
  257. static unsigned int mysqlnd_mbcharlen_gb2312(unsigned int gb)
  258. {
  259. return (valid_gb2312_head(gb)) ? 2 : 1;
  260. }
  261. /* }}} */
  262. /* {{{ gbk functions */
  263. #define valid_gbk_head(c) (0x81<=(zend_uchar)(c) && (zend_uchar)(c)<=0xFE)
  264. #define valid_gbk_tail(c) ((0x40<=(zend_uchar)(c) && (zend_uchar)(c)<=0x7E) || (0x80<=(zend_uchar)(c) && (zend_uchar)(c)<=0xFE))
  265. static unsigned int check_mb_gbk(const char *start, const char *end)
  266. {
  267. return (valid_gbk_head(start[0]) && (end) - (start) > 1 && valid_gbk_tail(start[1])) ? 2 : 0;
  268. }
  269. static unsigned int mysqlnd_mbcharlen_gbk(unsigned int gbk)
  270. {
  271. return (valid_gbk_head(gbk) ? 2 : 1);
  272. }
  273. /* }}} */
  274. /* {{{ sjis functions */
  275. #define valid_sjis_head(c) ((0x81 <= (c) && (c) <= 0x9F) || (0xE0 <= (c) && (c) <= 0xFC))
  276. #define valid_sjis_tail(c) ((0x40 <= (c) && (c) <= 0x7E) || (0x80 <= (c) && (c) <= 0xFC))
  277. static unsigned int check_mb_sjis(const char *start, const char *end)
  278. {
  279. return (valid_sjis_head((zend_uchar)start[0]) && (end - start) > 1 && valid_sjis_tail((zend_uchar)start[1])) ? 2 : 0;
  280. }
  281. static unsigned int mysqlnd_mbcharlen_sjis(unsigned int sjis)
  282. {
  283. return (valid_sjis_head((zend_uchar)sjis)) ? 2 : 1;
  284. }
  285. /* }}} */
  286. /* {{{ ucs2 functions */
  287. static unsigned int check_mb_ucs2(const char *start __attribute((unused)), const char *end __attribute((unused)))
  288. {
  289. return 2; /* always 2 */
  290. }
  291. static unsigned int mysqlnd_mbcharlen_ucs2(unsigned int ucs2 __attribute((unused)))
  292. {
  293. return 2; /* always 2 */
  294. }
  295. /* }}} */
  296. /* {{{ ujis functions */
  297. #define valid_ujis(c) ((0xA1 <= ((c)&0xFF) && ((c)&0xFF) <= 0xFE))
  298. #define valid_ujis_kata(c) ((0xA1 <= ((c)&0xFF) && ((c)&0xFF) <= 0xDF))
  299. #define valid_ujis_ss2(c) (((c)&0xFF) == 0x8E)
  300. #define valid_ujis_ss3(c) (((c)&0xFF) == 0x8F)
  301. static unsigned int check_mb_ujis(const char *start, const char *end)
  302. {
  303. if (*(zend_uchar*)start < 0x80) {
  304. return 0; /* invalid ujis character */
  305. }
  306. if (valid_ujis(*(start)) && valid_ujis(*((start)+1))) {
  307. return 2;
  308. }
  309. if (valid_ujis_ss2(*(start)) && valid_ujis_kata(*((start)+1))) {
  310. return 2;
  311. }
  312. if (valid_ujis_ss3(*(start)) && (end-start) > 2 && valid_ujis(*((start)+1)) && valid_ujis(*((start)+2))) {
  313. return 3;
  314. }
  315. return 0;
  316. }
  317. static unsigned int mysqlnd_mbcharlen_ujis(unsigned int ujis)
  318. {
  319. return (valid_ujis(ujis)? 2: valid_ujis_ss2(ujis)? 2: valid_ujis_ss3(ujis)? 3: 1);
  320. }
  321. /* }}} */
  322. /* {{{ utf16 functions */
  323. #define UTF16_HIGH_HEAD(x) ((((zend_uchar) (x)) & 0xFC) == 0xD8)
  324. #define UTF16_LOW_HEAD(x) ((((zend_uchar) (x)) & 0xFC) == 0xDC)
  325. static unsigned int check_mb_utf16(const char *start, const char *end)
  326. {
  327. if (start + 2 > end) {
  328. return 0;
  329. }
  330. if (UTF16_HIGH_HEAD(*start)) {
  331. return (start + 4 <= end) && UTF16_LOW_HEAD(start[2]) ? 4 : 0;
  332. }
  333. if (UTF16_LOW_HEAD(*start)) {
  334. return 0;
  335. }
  336. return 2;
  337. }
  338. static uint32_t mysqlnd_mbcharlen_utf16(unsigned int utf16)
  339. {
  340. return UTF16_HIGH_HEAD(utf16) ? 4 : 2;
  341. }
  342. /* }}} */
  343. /* {{{ utf32 functions */
  344. static unsigned int check_mb_utf32(const char *start __attribute((unused)), const char *end __attribute((unused)))
  345. {
  346. return 4;
  347. }
  348. static unsigned int mysqlnd_mbcharlen_utf32(unsigned int utf32 __attribute((unused)))
  349. {
  350. return 4;
  351. }
  352. /* }}} */
  353. /* {{{ gb18030 functions */
  354. #define is_gb18030_odd(c) (0x81 <= (zend_uchar) (c) && (zend_uchar) (c) <= 0xFE)
  355. #define is_gb18030_even_2(c) ((0x40 <= (zend_uchar) (c) && (zend_uchar) (c) <= 0x7E) || (0x80 <= (zend_uchar) (c) && (zend_uchar) (c) <= 0xFE))
  356. #define is_gb18030_even_4(c) (0x30 <= (zend_uchar) (c) && (zend_uchar) (c) <= 0x39)
  357. static unsigned int mysqlnd_mbcharlen_gb18030(unsigned int c)
  358. {
  359. if (c <= 0xFF) {
  360. return !is_gb18030_odd(c);
  361. }
  362. if (c > 0xFFFF || !is_gb18030_odd((c >> 8) & 0xFF)) {
  363. return 0;
  364. }
  365. if (is_gb18030_even_2((c & 0xFF))) {
  366. return 2;
  367. }
  368. if (is_gb18030_even_4((c & 0xFF))) {
  369. return 4;
  370. }
  371. return 0;
  372. }
  373. static unsigned int my_ismbchar_gb18030(const char * start, const char * end)
  374. {
  375. if (end - start <= 1 || !is_gb18030_odd(start[0])) {
  376. return 0;
  377. }
  378. if (is_gb18030_even_2(start[1])) {
  379. return 2;
  380. } else if (end - start > 3 && is_gb18030_even_4(start[1]) && is_gb18030_odd(start[2]) && is_gb18030_even_4(start[3])) {
  381. return 4;
  382. }
  383. return 0;
  384. }
  385. /* }}} */
  386. /*
  387. The server compiles sometimes the full utf-8 (the mb4) as utf8m4, and the old as utf8,
  388. for BC reasons. Sometimes, utf8mb4 is just utf8 but the old charsets are utf8mb3.
  389. Change easily now, with a macro, could be made compilastion dependable.
  390. */
  391. #define UTF8_MB4 "utf8mb4"
  392. #define UTF8_MB3 "utf8"
  393. /* {{{ mysqlnd_charsets */
  394. const MYSQLND_CHARSET mysqlnd_charsets[] =
  395. {
  396. { 1, "big5","big5_chinese_ci", 1, 2, "", mysqlnd_mbcharlen_big5, check_mb_big5},
  397. { 3, "dec8", "dec8_swedish_ci", 1, 1, "", NULL, NULL},
  398. { 4, "cp850", "cp850_general_ci", 1, 1, "", NULL, NULL},
  399. { 6, "hp8", "hp8_english_ci", 1, 1, "", NULL, NULL},
  400. { 7, "koi8r", "koi8r_general_ci", 1, 1, "", NULL, NULL},
  401. { 8, "latin1", "latin1_swedish_ci", 1, 1, "", NULL, NULL},
  402. { 5, "latin1", "latin1_german1_ci", 1, 1, "", NULL, NULL}, /* should be after 0x8 because swedish_ci is the default collation */
  403. { 9, "latin2", "latin2_general_ci", 1, 1, "", NULL, NULL},
  404. { 2, "latin2", "latin2_czech_cs", 1, 1, "", NULL, NULL}, /* should be after 0x9 because general_ci is the default collation */
  405. { 10, "swe7", "swe7_swedish_ci", 1, 1, "", NULL, NULL},
  406. { 11, "ascii", "ascii_general_ci", 1, 1, "", NULL, NULL},
  407. { 12, "ujis", "ujis_japanese_ci", 1, 3, "", mysqlnd_mbcharlen_ujis, check_mb_ujis},
  408. { 13, "sjis", "sjis_japanese_ci", 1, 2, "", mysqlnd_mbcharlen_sjis, check_mb_sjis},
  409. { 16, "hebrew", "hebrew_general_ci", 1, 1, "", NULL, NULL},
  410. { 17, "filename", "filename", 1, 5, "", NULL, NULL},
  411. { 18, "tis620", "tis620_thai_ci", 1, 1, "", NULL, NULL},
  412. { 19, "euckr", "euckr_korean_ci", 1, 2, "", mysqlnd_mbcharlen_euckr, check_mb_euckr},
  413. { 21, "latin2", "latin2_hungarian_ci", 1, 1, "", NULL, NULL},
  414. { 27, "latin2", "latin2_croatian_ci", 1, 1, "", NULL, NULL},
  415. { 22, "koi8u", "koi8u_general_ci", 1, 1, "", NULL, NULL},
  416. { 24, "gb2312", "gb2312_chinese_ci", 1, 2, "", mysqlnd_mbcharlen_gb2312, check_mb_gb2312},
  417. { 25, "greek", "greek_general_ci", 1, 1, "", NULL, NULL},
  418. { 26, "cp1250", "cp1250_general_ci", 1, 1, "", NULL, NULL},
  419. { 28, "gbk", "gbk_chinese_ci", 1, 2, "", mysqlnd_mbcharlen_gbk, check_mb_gbk},
  420. { 30, "latin5", "latin5_turkish_ci", 1, 1, "", NULL, NULL},
  421. { 31, "latin1", "latin1_german2_ci", 1, 1, "", NULL, NULL},
  422. { 15, "latin1", "latin1_danish_ci", 1, 1, "", NULL, NULL},
  423. { 32, "armscii8", "armscii8_general_ci", 1, 1, "", NULL, NULL},
  424. { 33, UTF8_MB3, UTF8_MB3"_general_ci", 1, 3, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  425. { 35, "ucs2", "ucs2_general_ci", 2, 2, "UCS-2 Unicode", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  426. { 36, "cp866", "cp866_general_ci", 1, 1, "", NULL, NULL},
  427. { 37, "keybcs2", "keybcs2_general_ci", 1, 1, "", NULL, NULL},
  428. { 38, "macce", "macce_general_ci", 1, 1, "", NULL, NULL},
  429. { 39, "macroman", "macroman_general_ci", 1, 1, "", NULL, NULL},
  430. { 40, "cp852", "cp852_general_ci", 1, 1, "", NULL, NULL},
  431. { 41, "latin7", "latin7_general_ci", 1, 1, "", NULL, NULL},
  432. { 20, "latin7", "latin7_estonian_cs", 1, 1, "", NULL, NULL},
  433. { 57, "cp1256", "cp1256_general_ci", 1, 1, "", NULL, NULL},
  434. { 59, "cp1257", "cp1257_general_ci", 1, 1, "", NULL, NULL},
  435. { 63, "binary", "binary", 1, 1, "", NULL, NULL},
  436. { 97, "eucjpms", "eucjpms_japanese_ci", 1, 3, "", mysqlnd_mbcharlen_eucjpms, check_mb_eucjpms},
  437. { 29, "cp1257", "cp1257_lithuanian_ci", 1, 1, "", NULL, NULL},
  438. { 31, "latin1", "latin1_german2_ci", 1, 1, "", NULL, NULL},
  439. { 34, "cp1250", "cp1250_czech_cs", 1, 1, "", NULL, NULL},
  440. { 42, "latin7", "latin7_general_cs", 1, 1, "", NULL, NULL},
  441. { 43, "macce", "macce_bin", 1, 1, "", NULL, NULL},
  442. { 44, "cp1250", "cp1250_croatian_ci", 1, 1, "", NULL, NULL},
  443. { 45, UTF8_MB4, UTF8_MB4"_general_ci", 1, 4, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  444. { 46, UTF8_MB4, UTF8_MB4"_bin", 1, 4, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  445. { 47, "latin1", "latin1_bin", 1, 1, "", NULL, NULL},
  446. { 48, "latin1", "latin1_general_ci", 1, 1, "", NULL, NULL},
  447. { 49, "latin1", "latin1_general_cs", 1, 1, "", NULL, NULL},
  448. { 51, "cp1251", "cp1251_general_ci", 1, 1, "", NULL, NULL},
  449. { 14, "cp1251", "cp1251_bulgarian_ci", 1, 1, "", NULL, NULL},
  450. { 23, "cp1251", "cp1251_ukrainian_ci", 1, 1, "", NULL, NULL},
  451. { 50, "cp1251", "cp1251_bin", 1, 1, "", NULL, NULL},
  452. { 52, "cp1251", "cp1251_general_cs", 1, 1, "", NULL, NULL},
  453. { 53, "macroman", "macroman_bin", 1, 1, "", NULL, NULL},
  454. { 54, "utf16", "utf16_general_ci", 2, 4, "UTF-16 Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
  455. { 55, "utf16", "utf16_bin", 2, 4, "UTF-16 Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
  456. { 56, "utf16le", "utf16le_general_ci", 2, 4, "UTF-16LE Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
  457. { 58, "cp1257", "cp1257_bin", 1, 1, "", NULL, NULL},
  458. /*55*/{ 60, "utf32", "utf32_general_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  459. /*55*/{ 61, "utf32", "utf32_bin", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  460. { 62, "utf16le", "utf16le_bin", 2, 4, "UTF-16LE Unicode", mysqlnd_mbcharlen_utf16, check_mb_utf16},
  461. { 64, "armscii8", "armscii8_bin", 1, 1, "", NULL, NULL},
  462. { 65, "ascii", "ascii_bin", 1, 1, "", NULL, NULL},
  463. { 66, "cp1250", "cp1250_bin", 1, 1, "", NULL, NULL},
  464. { 67, "cp1256", "cp1256_bin", 1, 1, "", NULL, NULL},
  465. { 68, "cp866", "cp866_bin", 1, 1, "", NULL, NULL},
  466. { 69, "dec8", "dec8_bin", 1, 1, "", NULL, NULL},
  467. { 70, "greek", "greek_bin", 1, 1, "", NULL, NULL},
  468. { 71, "hebrew", "hebrew_bin", 1, 1, "", NULL, NULL},
  469. { 72, "hp8", "hp8_bin", 1, 1, "", NULL, NULL},
  470. { 73, "keybcs2", "keybcs2_bin", 1, 1, "", NULL, NULL},
  471. { 74, "koi8r", "koi8r_bin", 1, 1, "", NULL, NULL},
  472. { 75, "koi8u", "koi8u_bin", 1, 1, "", NULL, NULL},
  473. { 77, "latin2", "latin2_bin", 1, 1, "", NULL, NULL},
  474. { 78, "latin5", "latin5_bin", 1, 1, "", NULL, NULL},
  475. { 79, "latin7", "latin7_bin", 1, 1, "", NULL, NULL},
  476. { 80, "cp850", "cp850_bin", 1, 1, "", NULL, NULL},
  477. { 81, "cp852", "cp852_bin", 1, 1, "", NULL, NULL},
  478. { 82, "swe7", "swe7_bin", 1, 1, "", NULL, NULL},
  479. { 83, UTF8_MB3, UTF8_MB3"_bin", 1, 3, "UTF-8 Unicode", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  480. { 84, "big5", "big5_bin", 1, 2, "", mysqlnd_mbcharlen_big5, check_mb_big5},
  481. { 85, "euckr", "euckr_bin", 1, 2, "", mysqlnd_mbcharlen_euckr, check_mb_euckr},
  482. { 86, "gb2312", "gb2312_bin", 1, 2, "", mysqlnd_mbcharlen_gb2312, check_mb_gb2312},
  483. { 87, "gbk", "gbk_bin", 1, 2, "", mysqlnd_mbcharlen_gbk, check_mb_gbk},
  484. { 88, "sjis", "sjis_bin", 1, 2, "", mysqlnd_mbcharlen_sjis, check_mb_sjis},
  485. { 89, "tis620", "tis620_bin", 1, 1, "", NULL, NULL},
  486. { 90, "ucs2", "ucs2_bin", 2, 2, "UCS-2 Unicode", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  487. { 91, "ujis", "ujis_bin", 1, 3, "", mysqlnd_mbcharlen_ujis, check_mb_ujis},
  488. { 92, "geostd8", "geostd8_general_ci", 1, 1, "", NULL, NULL},
  489. { 93, "geostd8", "geostd8_bin", 1, 1, "", NULL, NULL},
  490. { 94, "latin1", "latin1_spanish_ci", 1, 1, "", NULL, NULL},
  491. { 95, "cp932", "cp932_japanese_ci", 1, 2, "", mysqlnd_mbcharlen_cp932, check_mb_cp932},
  492. { 96, "cp932", "cp932_bin", 1, 2, "", mysqlnd_mbcharlen_cp932, check_mb_cp932},
  493. { 97, "eucjpms", "eucjpms_japanese_ci", 1, 3, "", mysqlnd_mbcharlen_eucjpms, check_mb_eucjpms},
  494. { 98, "eucjpms", "eucjpms_bin", 1, 3, "", mysqlnd_mbcharlen_eucjpms, check_mb_eucjpms},
  495. { 99, "cp1250", "cp1250_polish_ci", 1, 1, "", NULL, NULL},
  496. { 128, "ucs2", "ucs2_unicode_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  497. { 129, "ucs2", "ucs2_icelandic_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  498. { 130, "ucs2", "ucs2_latvian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  499. { 131, "ucs2", "ucs2_romanian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  500. { 132, "ucs2", "ucs2_slovenian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  501. { 133, "ucs2", "ucs2_polish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  502. { 134, "ucs2", "ucs2_estonian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  503. { 135, "ucs2", "ucs2_spanish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  504. { 136, "ucs2", "ucs2_swedish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  505. { 137, "ucs2", "ucs2_turkish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  506. { 138, "ucs2", "ucs2_czech_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  507. { 139, "ucs2", "ucs2_danish_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  508. { 140, "ucs2", "ucs2_lithuanian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  509. { 141, "ucs2", "ucs2_slovak_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  510. { 142, "ucs2", "ucs2_spanish2_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  511. { 143, "ucs2", "ucs2_roman_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  512. { 144, "ucs2", "ucs2_persian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  513. { 145, "ucs2", "ucs2_esperanto_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  514. { 146, "ucs2", "ucs2_hungarian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  515. { 147, "ucs2", "ucs2_sinhala_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  516. { 148, "ucs2", "ucs2_german2_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  517. { 149, "ucs2", "ucs2_croatian_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  518. { 150, "ucs2", "ucs2_unicode_520_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  519. { 151, "ucs2", "ucs2_vietnamese_ci", 2, 2, "", mysqlnd_mbcharlen_ucs2, check_mb_ucs2},
  520. /*56*/{160, "utf32", "utf32_unicode_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  521. /*56*/{161, "utf32", "utf32_icelandic_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  522. /*56*/{162, "utf32", "utf32_latvian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  523. /*56*/{163, "utf32", "utf32_romanian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  524. /*56*/{164, "utf32", "utf32_slovenian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  525. /*56*/{165, "utf32", "utf32_polish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  526. /*56*/{166, "utf32", "utf32_estonian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  527. /*56*/{167, "utf32", "utf32_spanish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  528. /*56*/{168, "utf32", "utf32_swedish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  529. /*56*/{169, "utf32", "utf32_turkish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  530. /*56*/{170, "utf32", "utf32_czech_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  531. /*56*/{171, "utf32", "utf32_danish_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  532. /*56*/{172, "utf32", "utf32_lithuanian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  533. /*56*/{173, "utf32", "utf32_slovak_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  534. /*56*/{174, "utf32", "utf32_spanish2_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  535. /*56*/{175, "utf32", "utf32_roman_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  536. /*56*/{176, "utf32", "utf32_persian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  537. /*56*/{177, "utf32", "utf32_esperanto_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  538. /*56*/{178, "utf32", "utf32_hungarian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  539. /*56*/{179, "utf32", "utf32_sinhala_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  540. /*56*/{180, "utf32", "utf32_german2_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  541. /*56*/{181, "utf32", "utf32_croatian_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  542. /*56*/{182, "utf32", "utf32_unicode_520_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  543. /*56*/{183, "utf32", "utf32_vietnamese_ci", 4, 4, "UTF-32 Unicode", mysqlnd_mbcharlen_utf32, check_mb_utf32},
  544. { 192, UTF8_MB3, UTF8_MB3"_unicode_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  545. { 193, UTF8_MB3, UTF8_MB3"_icelandic_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  546. { 194, UTF8_MB3, UTF8_MB3"_latvian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  547. { 195, UTF8_MB3, UTF8_MB3"_romanian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  548. { 196, UTF8_MB3, UTF8_MB3"_slovenian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  549. { 197, UTF8_MB3, UTF8_MB3"_polish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  550. { 198, UTF8_MB3, UTF8_MB3"_estonian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  551. { 199, UTF8_MB3, UTF8_MB3"_spanish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  552. { 200, UTF8_MB3, UTF8_MB3"_swedish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  553. { 201, UTF8_MB3, UTF8_MB3"_turkish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  554. { 202, UTF8_MB3, UTF8_MB3"_czech_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  555. { 203, UTF8_MB3, UTF8_MB3"_danish_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid },
  556. { 204, UTF8_MB3, UTF8_MB3"_lithuanian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid },
  557. { 205, UTF8_MB3, UTF8_MB3"_slovak_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  558. { 206, UTF8_MB3, UTF8_MB3"_spanish2_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  559. { 207, UTF8_MB3, UTF8_MB3"_roman_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  560. { 208, UTF8_MB3, UTF8_MB3"_persian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  561. { 209, UTF8_MB3, UTF8_MB3"_esperanto_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  562. { 210, UTF8_MB3, UTF8_MB3"_hungarian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  563. { 211, UTF8_MB3, UTF8_MB3"_sinhala_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  564. { 212, UTF8_MB3, UTF8_MB3"_german2_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  565. { 213, UTF8_MB3, UTF8_MB3"_croatian_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  566. { 214, UTF8_MB3, UTF8_MB3"_unicode_520_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  567. { 215, UTF8_MB3, UTF8_MB3"_vietnamese_ci", 1, 3, "", mysqlnd_mbcharlen_utf8mb3, check_mb_utf8mb3_valid},
  568. { 224, UTF8_MB4, UTF8_MB4"_unicode_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  569. { 225, UTF8_MB4, UTF8_MB4"_icelandic_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  570. { 226, UTF8_MB4, UTF8_MB4"_latvian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  571. { 227, UTF8_MB4, UTF8_MB4"_romanian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  572. { 228, UTF8_MB4, UTF8_MB4"_slovenian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  573. { 229, UTF8_MB4, UTF8_MB4"_polish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  574. { 230, UTF8_MB4, UTF8_MB4"_estonian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  575. { 231, UTF8_MB4, UTF8_MB4"_spanish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  576. { 232, UTF8_MB4, UTF8_MB4"_swedish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  577. { 233, UTF8_MB4, UTF8_MB4"_turkish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  578. { 234, UTF8_MB4, UTF8_MB4"_czech_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  579. { 235, UTF8_MB4, UTF8_MB4"_danish_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  580. { 236, UTF8_MB4, UTF8_MB4"_lithuanian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  581. { 237, UTF8_MB4, UTF8_MB4"_slovak_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  582. { 238, UTF8_MB4, UTF8_MB4"_spanish2_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  583. { 239, UTF8_MB4, UTF8_MB4"_roman_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  584. { 240, UTF8_MB4, UTF8_MB4"_persian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  585. { 241, UTF8_MB4, UTF8_MB4"_esperanto_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  586. { 242, UTF8_MB4, UTF8_MB4"_hungarian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  587. { 243, UTF8_MB4, UTF8_MB4"_sinhala_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  588. { 244, UTF8_MB4, UTF8_MB4"_german2_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  589. { 245, UTF8_MB4, UTF8_MB4"_croatian_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  590. { 246, UTF8_MB4, UTF8_MB4"_unicode_520_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  591. { 247, UTF8_MB4, UTF8_MB4"_vietnamese_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  592. { 248, "gb18030", "gb18030_chinese_ci", 1, 4, "", mysqlnd_mbcharlen_gb18030, my_ismbchar_gb18030},
  593. { 249, "gb18030", "gb18030_bin", 1, 4, "", mysqlnd_mbcharlen_gb18030, my_ismbchar_gb18030},
  594. { 254, UTF8_MB3, UTF8_MB3"_general_cs", 1, 3, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  595. { 255, UTF8_MB4, UTF8_MB4"_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  596. { 256, UTF8_MB4, UTF8_MB4"_de_pb_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  597. { 257, UTF8_MB4, UTF8_MB4"_is_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  598. { 258, UTF8_MB4, UTF8_MB4"_lv_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  599. { 259, UTF8_MB4, UTF8_MB4"_ro_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  600. { 260, UTF8_MB4, UTF8_MB4"_sl_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  601. { 261, UTF8_MB4, UTF8_MB4"_pl_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  602. { 262, UTF8_MB4, UTF8_MB4"_et_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  603. { 263, UTF8_MB4, UTF8_MB4"_es_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  604. { 264, UTF8_MB4, UTF8_MB4"_sv_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  605. { 265, UTF8_MB4, UTF8_MB4"_tr_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  606. { 266, UTF8_MB4, UTF8_MB4"_cs_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  607. { 267, UTF8_MB4, UTF8_MB4"_da_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  608. { 268, UTF8_MB4, UTF8_MB4"_lt_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  609. { 269, UTF8_MB4, UTF8_MB4"_sk_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  610. { 270, UTF8_MB4, UTF8_MB4"_es_trad_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  611. { 271, UTF8_MB4, UTF8_MB4"_la_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  612. { 272, UTF8_MB4, UTF8_MB4"_fa_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  613. { 273, UTF8_MB4, UTF8_MB4"_eo_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  614. { 274, UTF8_MB4, UTF8_MB4"_hu_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  615. { 275, UTF8_MB4, UTF8_MB4"_hr_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  616. { 276, UTF8_MB4, UTF8_MB4"_si_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  617. { 277, UTF8_MB4, UTF8_MB4"_vi_0900_ai_ci", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  618. { 278, UTF8_MB4, UTF8_MB4"_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  619. { 279, UTF8_MB4, UTF8_MB4"_de_pb_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  620. { 280, UTF8_MB4, UTF8_MB4"_is_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  621. { 281, UTF8_MB4, UTF8_MB4"_lv_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  622. { 282, UTF8_MB4, UTF8_MB4"_ro_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  623. { 283, UTF8_MB4, UTF8_MB4"_sl_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  624. { 284, UTF8_MB4, UTF8_MB4"_pl_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  625. { 285, UTF8_MB4, UTF8_MB4"_et_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  626. { 286, UTF8_MB4, UTF8_MB4"_es_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  627. { 287, UTF8_MB4, UTF8_MB4"_sv_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  628. { 288, UTF8_MB4, UTF8_MB4"_tr_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  629. { 289, UTF8_MB4, UTF8_MB4"_cs_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  630. { 290, UTF8_MB4, UTF8_MB4"_da_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  631. { 291, UTF8_MB4, UTF8_MB4"_lt_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  632. { 292, UTF8_MB4, UTF8_MB4"_sk_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  633. { 293, UTF8_MB4, UTF8_MB4"_es_trad_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  634. { 294, UTF8_MB4, UTF8_MB4"_la_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  635. { 295, UTF8_MB4, UTF8_MB4"_fa_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  636. { 296, UTF8_MB4, UTF8_MB4"_eo_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  637. { 297, UTF8_MB4, UTF8_MB4"_hu_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  638. { 298, UTF8_MB4, UTF8_MB4"_hr_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  639. { 299, UTF8_MB4, UTF8_MB4"_si_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  640. { 300, UTF8_MB4, UTF8_MB4"_vi_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  641. { 303, UTF8_MB4, UTF8_MB4"_ja_0900_as_cs", 1, 4, "", mysqlnd_mbcharlen_utf8, check_mb_utf8_valid},
  642. { 0, NULL, NULL, 0, 0, NULL, NULL, NULL}
  643. };
  644. /* }}} */
  645. /* {{{ mysqlnd_find_charset_nr */
  646. PHPAPI const MYSQLND_CHARSET * mysqlnd_find_charset_nr(unsigned int charsetnr)
  647. {
  648. const MYSQLND_CHARSET * c = mysqlnd_charsets;
  649. do {
  650. if (c->nr == charsetnr) {
  651. return c;
  652. }
  653. ++c;
  654. } while (c[0].nr != 0);
  655. return NULL;
  656. }
  657. /* }}} */
  658. /* {{{ mysqlnd_find_charset_name */
  659. PHPAPI const MYSQLND_CHARSET * mysqlnd_find_charset_name(const char * const name)
  660. {
  661. if (name) {
  662. const MYSQLND_CHARSET * c = mysqlnd_charsets;
  663. do {
  664. if (!strcasecmp(c->name, name)) {
  665. return c;
  666. }
  667. ++c;
  668. } while (c[0].nr != 0);
  669. }
  670. return NULL;
  671. }
  672. /* }}} */
  673. /* {{{ mysqlnd_cset_escape_quotes */
  674. PHPAPI zend_ulong mysqlnd_cset_escape_quotes(const MYSQLND_CHARSET * const cset, char *newstr,
  675. const char * escapestr, size_t escapestr_len)
  676. {
  677. const char *newstr_s = newstr;
  678. const char *newstr_e = newstr + 2 * escapestr_len;
  679. const char *end = escapestr + escapestr_len;
  680. zend_bool escape_overflow = FALSE;
  681. DBG_ENTER("mysqlnd_cset_escape_quotes");
  682. for (;escapestr < end; escapestr++) {
  683. unsigned int len = 0;
  684. /* check unicode characters */
  685. if (cset->char_maxlen > 1 && (len = cset->mb_valid(escapestr, end))) {
  686. /* check possible overflow */
  687. if ((newstr + len) > newstr_e) {
  688. escape_overflow = TRUE;
  689. break;
  690. }
  691. /* copy mb char without escaping it */
  692. while (len--) {
  693. *newstr++ = *escapestr++;
  694. }
  695. escapestr--;
  696. continue;
  697. }
  698. if (*escapestr == '\'') {
  699. if (newstr + 2 > newstr_e) {
  700. escape_overflow = TRUE;
  701. break;
  702. }
  703. *newstr++ = '\'';
  704. *newstr++ = '\'';
  705. } else {
  706. if (newstr + 1 > newstr_e) {
  707. escape_overflow = TRUE;
  708. break;
  709. }
  710. *newstr++ = *escapestr;
  711. }
  712. }
  713. *newstr = '\0';
  714. if (escape_overflow) {
  715. DBG_RETURN((ulong)~0);
  716. }
  717. DBG_RETURN((ulong)(newstr - newstr_s));
  718. }
  719. /* }}} */
  720. /* {{{ mysqlnd_cset_escape_slashes */
  721. PHPAPI zend_ulong mysqlnd_cset_escape_slashes(const MYSQLND_CHARSET * const cset, char *newstr,
  722. const char * escapestr, size_t escapestr_len)
  723. {
  724. const char *newstr_s = newstr;
  725. const char *newstr_e = newstr + 2 * escapestr_len;
  726. const char *end = escapestr + escapestr_len;
  727. zend_bool escape_overflow = FALSE;
  728. DBG_ENTER("mysqlnd_cset_escape_slashes");
  729. DBG_INF_FMT("charset=%s", cset->name);
  730. for (;escapestr < end; escapestr++) {
  731. char esc = '\0';
  732. unsigned int len = 0;
  733. /* check unicode characters */
  734. if (cset->char_maxlen > 1 && (len = cset->mb_valid(escapestr, end))) {
  735. /* check possible overflow */
  736. if ((newstr + len) > newstr_e) {
  737. escape_overflow = TRUE;
  738. break;
  739. }
  740. /* copy mb char without escaping it */
  741. while (len--) {
  742. *newstr++ = *escapestr++;
  743. }
  744. escapestr--;
  745. continue;
  746. }
  747. if (cset->char_maxlen > 1 && cset->mb_charlen(*escapestr) > 1) {
  748. esc = *escapestr;
  749. } else {
  750. switch (*escapestr) {
  751. case 0:
  752. esc = '0';
  753. break;
  754. case '\n':
  755. esc = 'n';
  756. break;
  757. case '\r':
  758. esc = 'r';
  759. break;
  760. case '\\':
  761. case '\'':
  762. case '"':
  763. esc = *escapestr;
  764. break;
  765. case '\032':
  766. esc = 'Z';
  767. break;
  768. }
  769. }
  770. if (esc) {
  771. if (newstr + 2 > newstr_e) {
  772. escape_overflow = TRUE;
  773. break;
  774. }
  775. /* copy escaped character */
  776. *newstr++ = '\\';
  777. *newstr++ = esc;
  778. } else {
  779. if (newstr + 1 > newstr_e) {
  780. escape_overflow = TRUE;
  781. break;
  782. }
  783. /* copy non escaped character */
  784. *newstr++ = *escapestr;
  785. }
  786. }
  787. *newstr = '\0';
  788. if (escape_overflow) {
  789. DBG_RETURN((ulong)~0);
  790. }
  791. DBG_RETURN((ulong)(newstr - newstr_s));
  792. }
  793. /* }}} */
  794. static struct st_mysqlnd_plugin_charsets mysqlnd_plugin_charsets_plugin =
  795. {
  796. {
  797. MYSQLND_PLUGIN_API_VERSION,
  798. "charsets",
  799. MYSQLND_VERSION_ID,
  800. PHP_MYSQLND_VERSION,
  801. "PHP License 3.01",
  802. "Andrey Hristov <andrey@php.net>, Ulf Wendel <uw@php.net>, Georg Richter <georg@php.net>",
  803. {
  804. NULL, /* no statistics , will be filled later if there are some */
  805. NULL, /* no statistics */
  806. },
  807. {
  808. NULL /* plugin shutdown */
  809. }
  810. },
  811. {/* methods */
  812. mysqlnd_find_charset_nr,
  813. mysqlnd_find_charset_name,
  814. mysqlnd_cset_escape_quotes,
  815. mysqlnd_cset_escape_slashes
  816. }
  817. };
  818. /* {{{ mysqlnd_charsets_plugin_register */
  819. void
  820. mysqlnd_charsets_plugin_register(void)
  821. {
  822. mysqlnd_plugin_register_ex((struct st_mysqlnd_plugin_header *) &mysqlnd_plugin_charsets_plugin);
  823. }
  824. /* }}} */
  825. /*
  826. * Local variables:
  827. * tab-width: 4
  828. * c-basic-offset: 4
  829. * End:
  830. * vim600: noet sw=4 ts=4 fdm=marker
  831. * vim<600: noet sw=4 ts=4
  832. */