mb_ereg_variation6.phpt 3.5 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192
  1. --TEST--
  2. Test mb_ereg() function : usage variations - match special characters
  3. --SKIPIF--
  4. <?php
  5. extension_loaded('mbstring') or die('skip');
  6. function_exists('mb_ereg') or die("skip mb_ereg() is not available in this build");
  7. ?>
  8. --FILE--
  9. <?php
  10. /* Prototype : int mb_ereg(string $pattern, string $string [, array $registers])
  11. * Description: Regular expression match for multibyte string
  12. * Source code: ext/mbstring/php_mbregex.c
  13. */
  14. /*
  15. * Test how mb_ereg() matches special characters for $pattern
  16. */
  17. echo "*** Testing mb_ereg() : usage variations ***\n";
  18. if(mb_regex_encoding('utf-8') == true) {
  19. echo "Regex encoding set to utf-8\n";
  20. } else {
  21. echo "Could not set regex encoding to utf-8\n";
  22. }
  23. $regex_char = array ('\w+' => b'\w+',
  24. '\W+' => b'\W+',
  25. '\s+' => b'\s+',
  26. '\S+' => b'\S+',
  27. '\d+' => b'\d+',
  28. '\D+' => b'\D+',
  29. '\b' => b'\b',
  30. '\B' => b'\B');
  31. $string_ascii = b'This is an English string. 0123456789.';
  32. $string_mb = base64_decode('5pel5pys6Kqe44OG44Kt44K544OI44Gn44GZ44CCMDEyMzTvvJXvvJbvvJfvvJjvvJnjgII=');
  33. foreach ($regex_char as $displayChar => $char) {
  34. echo "\n--** Pattern is: $displayChar **--\n";
  35. if (@$regs_ascii || @$regs_mb) {
  36. $regs_ascii = null;
  37. $regs_mb = null;
  38. }
  39. echo "-- ASCII String: --\n";
  40. var_dump(mb_ereg($char, $string_ascii, $regs_ascii));
  41. base64_encode_var_dump($regs_ascii);
  42. echo "-- Multibyte String: --\n";
  43. var_dump(mb_ereg($char, $string_mb, $regs_mb));
  44. base64_encode_var_dump($regs_mb);
  45. }
  46. /**
  47. * replicate a var dump of an array but outputted string values are base64 encoded
  48. *
  49. * @param array $regs
  50. */
  51. function base64_encode_var_dump($regs) {
  52. if ($regs) {
  53. echo "array(" . count($regs) . ") {\n";
  54. foreach ($regs as $key => $value) {
  55. echo " [$key]=>\n ";
  56. if (is_string($value)) {
  57. var_dump(base64_encode($value));
  58. } else {
  59. var_dump($value);
  60. }
  61. }
  62. echo "}\n";
  63. } else {
  64. echo "NULL\n";
  65. }
  66. }
  67. echo "Done";
  68. ?>
  69. --EXPECT--
  70. *** Testing mb_ereg() : usage variations ***
  71. Regex encoding set to utf-8
  72. --** Pattern is: \w+ **--
  73. -- ASCII String: --
  74. int(4)
  75. array(1) {
  76. [0]=>
  77. string(8) "VGhpcw=="
  78. }
  79. -- Multibyte String: --
  80. int(27)
  81. array(1) {
  82. [0]=>
  83. string(36) "5pel5pys6Kqe44OG44Kt44K544OI44Gn44GZ"
  84. }
  85. --** Pattern is: \W+ **--
  86. -- ASCII String: --
  87. int(1)
  88. array(1) {
  89. [0]=>
  90. string(4) "IA=="
  91. }
  92. -- Multibyte String: --
  93. int(3)
  94. array(1) {
  95. [0]=>
  96. string(4) "44CC"
  97. }
  98. --** Pattern is: \s+ **--
  99. -- ASCII String: --
  100. int(1)
  101. array(1) {
  102. [0]=>
  103. string(4) "IA=="
  104. }
  105. -- Multibyte String: --
  106. bool(false)
  107. NULL
  108. --** Pattern is: \S+ **--
  109. -- ASCII String: --
  110. int(4)
  111. array(1) {
  112. [0]=>
  113. string(8) "VGhpcw=="
  114. }
  115. -- Multibyte String: --
  116. int(53)
  117. array(1) {
  118. [0]=>
  119. string(72) "5pel5pys6Kqe44OG44Kt44K544OI44Gn44GZ44CCMDEyMzTvvJXvvJbvvJfvvJjvvJnjgII="
  120. }
  121. --** Pattern is: \d+ **--
  122. -- ASCII String: --
  123. int(10)
  124. array(1) {
  125. [0]=>
  126. string(16) "MDEyMzQ1Njc4OQ=="
  127. }
  128. -- Multibyte String: --
  129. int(20)
  130. array(1) {
  131. [0]=>
  132. string(28) "MDEyMzTvvJXvvJbvvJfvvJjvvJk="
  133. }
  134. --** Pattern is: \D+ **--
  135. -- ASCII String: --
  136. int(27)
  137. array(1) {
  138. [0]=>
  139. string(36) "VGhpcyBpcyBhbiBFbmdsaXNoIHN0cmluZy4g"
  140. }
  141. -- Multibyte String: --
  142. int(30)
  143. array(1) {
  144. [0]=>
  145. string(40) "5pel5pys6Kqe44OG44Kt44K544OI44Gn44GZ44CC"
  146. }
  147. --** Pattern is: \b **--
  148. -- ASCII String: --
  149. int(1)
  150. array(1) {
  151. [0]=>
  152. bool(false)
  153. }
  154. -- Multibyte String: --
  155. int(1)
  156. array(1) {
  157. [0]=>
  158. bool(false)
  159. }
  160. --** Pattern is: \B **--
  161. -- ASCII String: --
  162. int(1)
  163. array(1) {
  164. [0]=>
  165. bool(false)
  166. }
  167. -- Multibyte String: --
  168. int(1)
  169. array(1) {
  170. [0]=>
  171. bool(false)
  172. }
  173. Done