breakiterator_class.cpp 13 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377
  1. /*
  2. +----------------------------------------------------------------------+
  3. | PHP Version 7 |
  4. +----------------------------------------------------------------------+
  5. | This source file is subject to version 3.01 of the PHP license, |
  6. | that is bundled with this package in the file LICENSE, and is |
  7. | available through the world-wide-web at the following url: |
  8. | http://www.php.net/license/3_01.txt |
  9. | If you did not receive a copy of the PHP license and are unable to |
  10. | obtain it through the world-wide-web, please send a note to |
  11. | license@php.net so we can mail you a copy immediately. |
  12. +----------------------------------------------------------------------+
  13. | Authors: Gustavo Lopes <cataphract@php.net> |
  14. +----------------------------------------------------------------------+
  15. */
  16. #ifdef HAVE_CONFIG_H
  17. #include "config.h"
  18. #endif
  19. #include <unicode/brkiter.h>
  20. #include <unicode/rbbi.h>
  21. #include "codepointiterator_internal.h"
  22. #include "breakiterator_iterators.h"
  23. #include <typeinfo>
  24. extern "C" {
  25. #define USE_BREAKITERATOR_POINTER 1
  26. #include "breakiterator_class.h"
  27. #include "breakiterator_methods.h"
  28. #include "rulebasedbreakiterator_methods.h"
  29. #include "codepointiterator_methods.h"
  30. #include <zend_exceptions.h>
  31. #include <zend_interfaces.h>
  32. #include <assert.h>
  33. }
  34. using PHP::CodePointBreakIterator;
  35. using icu::RuleBasedBreakIterator;
  36. /* {{{ Global variables */
  37. zend_class_entry *BreakIterator_ce_ptr;
  38. zend_class_entry *RuleBasedBreakIterator_ce_ptr;
  39. zend_class_entry *CodePointBreakIterator_ce_ptr;
  40. zend_object_handlers BreakIterator_handlers;
  41. /* }}} */
  42. U_CFUNC void breakiterator_object_create(zval *object,
  43. BreakIterator *biter, int brand_new)
  44. {
  45. UClassID classId = biter->getDynamicClassID();
  46. zend_class_entry *ce;
  47. if (classId == RuleBasedBreakIterator::getStaticClassID()) {
  48. ce = RuleBasedBreakIterator_ce_ptr;
  49. } else if (classId == CodePointBreakIterator::getStaticClassID()) {
  50. ce = CodePointBreakIterator_ce_ptr;
  51. } else {
  52. ce = BreakIterator_ce_ptr;
  53. }
  54. if (brand_new) {
  55. object_init_ex(object, ce);
  56. }
  57. breakiterator_object_construct(object, biter);
  58. }
  59. U_CFUNC void breakiterator_object_construct(zval *object,
  60. BreakIterator *biter)
  61. {
  62. BreakIterator_object *bio;
  63. BREAKITER_METHOD_FETCH_OBJECT_NO_CHECK; //populate to from object
  64. assert(bio->biter == NULL);
  65. bio->biter = biter;
  66. }
  67. /* {{{ compare handler for BreakIterator */
  68. static int BreakIterator_compare_objects(zval *object1,
  69. zval *object2)
  70. {
  71. BreakIterator_object *bio1,
  72. *bio2;
  73. bio1 = Z_INTL_BREAKITERATOR_P(object1);
  74. bio2 = Z_INTL_BREAKITERATOR_P(object2);
  75. if (bio1->biter == NULL || bio2->biter == NULL) {
  76. return bio1->biter == bio2->biter ? 0 : 1;
  77. }
  78. return *bio1->biter == *bio2->biter ? 0 : 1;
  79. }
  80. /* }}} */
  81. /* {{{ clone handler for BreakIterator */
  82. static zend_object *BreakIterator_clone_obj(zval *object)
  83. {
  84. BreakIterator_object *bio_orig,
  85. *bio_new;
  86. zend_object *ret_val;
  87. bio_orig = Z_INTL_BREAKITERATOR_P(object);
  88. intl_errors_reset(INTL_DATA_ERROR_P(bio_orig));
  89. ret_val = BreakIterator_ce_ptr->create_object(Z_OBJCE_P(object));
  90. bio_new = php_intl_breakiterator_fetch_object(ret_val);
  91. zend_objects_clone_members(&bio_new->zo, &bio_orig->zo);
  92. if (bio_orig->biter != NULL) {
  93. BreakIterator *new_biter;
  94. new_biter = bio_orig->biter->clone();
  95. if (!new_biter) {
  96. zend_string *err_msg;
  97. intl_errors_set_code(BREAKITER_ERROR_P(bio_orig),
  98. U_MEMORY_ALLOCATION_ERROR);
  99. intl_errors_set_custom_msg(BREAKITER_ERROR_P(bio_orig),
  100. "Could not clone BreakIterator", 0);
  101. err_msg = intl_error_get_message(BREAKITER_ERROR_P(bio_orig));
  102. zend_throw_exception(NULL, ZSTR_VAL(err_msg), 0);
  103. zend_string_free(err_msg);
  104. } else {
  105. bio_new->biter = new_biter;
  106. ZVAL_COPY(&bio_new->text, &bio_orig->text);
  107. }
  108. } else {
  109. zend_throw_exception(NULL, "Cannot clone unconstructed BreakIterator", 0);
  110. }
  111. return ret_val;
  112. }
  113. /* }}} */
  114. /* {{{ get_debug_info handler for BreakIterator */
  115. static HashTable *BreakIterator_get_debug_info(zval *object, int *is_temp)
  116. {
  117. zval val;
  118. HashTable *debug_info;
  119. BreakIterator_object *bio;
  120. const BreakIterator *biter;
  121. *is_temp = 1;
  122. debug_info = zend_new_array(8);
  123. bio = Z_INTL_BREAKITERATOR_P(object);
  124. biter = bio->biter;
  125. if (biter == NULL) {
  126. ZVAL_FALSE(&val);
  127. zend_hash_str_update(debug_info, "valid", sizeof("valid") - 1, &val);
  128. return debug_info;
  129. }
  130. ZVAL_TRUE(&val);
  131. zend_hash_str_update(debug_info, "valid", sizeof("valid") - 1, &val);
  132. if (Z_ISUNDEF(bio->text)) {
  133. ZVAL_NULL(&val);
  134. zend_hash_str_update(debug_info, "text", sizeof("text") - 1, &val);
  135. } else {
  136. Z_TRY_ADDREF(bio->text);
  137. zend_hash_str_update(debug_info, "text", sizeof("text") - 1, &bio->text);
  138. }
  139. ZVAL_STRING(&val, const_cast<char*>(typeid(*biter).name()));
  140. zend_hash_str_update(debug_info, "type", sizeof("type") - 1, &val);
  141. return debug_info;
  142. }
  143. /* }}} */
  144. /* {{{ void breakiterator_object_init(BreakIterator_object* to)
  145. * Initialize internals of BreakIterator_object not specific to zend standard objects.
  146. */
  147. static void breakiterator_object_init(BreakIterator_object *bio)
  148. {
  149. intl_error_init(BREAKITER_ERROR_P(bio));
  150. bio->biter = NULL;
  151. ZVAL_UNDEF(&bio->text);
  152. }
  153. /* }}} */
  154. /* {{{ BreakIterator_objects_free */
  155. static void BreakIterator_objects_free(zend_object *object)
  156. {
  157. BreakIterator_object* bio = php_intl_breakiterator_fetch_object(object);
  158. zval_ptr_dtor(&bio->text);
  159. if (bio->biter) {
  160. delete bio->biter;
  161. bio->biter = NULL;
  162. }
  163. intl_error_reset(BREAKITER_ERROR_P(bio));
  164. zend_object_std_dtor(&bio->zo);
  165. }
  166. /* }}} */
  167. /* {{{ BreakIterator_object_create */
  168. static zend_object *BreakIterator_object_create(zend_class_entry *ce)
  169. {
  170. BreakIterator_object* intern;
  171. intern = (BreakIterator_object*)ecalloc(1, sizeof(BreakIterator_object) + sizeof(zval) * (ce->default_properties_count - 1));
  172. zend_object_std_init(&intern->zo, ce);
  173. object_properties_init((zend_object*) intern, ce);
  174. breakiterator_object_init(intern);
  175. intern->zo.handlers = &BreakIterator_handlers;
  176. return &intern->zo;
  177. }
  178. /* }}} */
  179. /* {{{ BreakIterator/RuleBasedBreakIterator methods arguments info */
  180. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_void, 0, 0, 0)
  181. ZEND_END_ARG_INFO()
  182. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_locale, 0, 0, 0)
  183. ZEND_ARG_INFO(0, locale)
  184. ZEND_END_ARG_INFO()
  185. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_setText, 0, 0, 1)
  186. ZEND_ARG_INFO(0, text)
  187. ZEND_END_ARG_INFO()
  188. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_next, 0, 0, 0)
  189. ZEND_ARG_INFO(0, offset)
  190. ZEND_END_ARG_INFO()
  191. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_offset, 0, 0, 1)
  192. ZEND_ARG_INFO(0, offset)
  193. ZEND_END_ARG_INFO()
  194. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_get_locale, 0, 0, 1)
  195. ZEND_ARG_INFO(0, locale_type)
  196. ZEND_END_ARG_INFO()
  197. ZEND_BEGIN_ARG_INFO_EX(ainfo_biter_getPartsIterator, 0, 0, 0)
  198. ZEND_ARG_INFO(0, key_type)
  199. ZEND_END_ARG_INFO()
  200. ZEND_BEGIN_ARG_INFO_EX(ainfo_rbbi___construct, 0, 0, 1)
  201. ZEND_ARG_INFO(0, rules)
  202. ZEND_ARG_INFO(0, areCompiled)
  203. ZEND_END_ARG_INFO()
  204. /* }}} */
  205. /* {{{ BreakIterator_class_functions
  206. * Every 'BreakIterator' class method has an entry in this table
  207. */
  208. static const zend_function_entry BreakIterator_class_functions[] = {
  209. PHP_ME(BreakIterator, __construct, ainfo_biter_void, ZEND_ACC_PRIVATE)
  210. PHP_ME_MAPPING(createWordInstance, breakiter_create_word_instance, ainfo_biter_locale, ZEND_ACC_STATIC | ZEND_ACC_PUBLIC)
  211. PHP_ME_MAPPING(createLineInstance, breakiter_create_line_instance, ainfo_biter_locale, ZEND_ACC_STATIC | ZEND_ACC_PUBLIC)
  212. PHP_ME_MAPPING(createCharacterInstance, breakiter_create_character_instance, ainfo_biter_locale, ZEND_ACC_STATIC | ZEND_ACC_PUBLIC)
  213. PHP_ME_MAPPING(createSentenceInstance, breakiter_create_sentence_instance, ainfo_biter_locale, ZEND_ACC_STATIC | ZEND_ACC_PUBLIC)
  214. PHP_ME_MAPPING(createTitleInstance, breakiter_create_title_instance, ainfo_biter_locale, ZEND_ACC_STATIC | ZEND_ACC_PUBLIC)
  215. PHP_ME_MAPPING(createCodePointInstance, breakiter_create_code_point_instance, ainfo_biter_void, ZEND_ACC_STATIC | ZEND_ACC_PUBLIC)
  216. PHP_ME_MAPPING(getText, breakiter_get_text, ainfo_biter_void, ZEND_ACC_PUBLIC)
  217. PHP_ME_MAPPING(setText, breakiter_set_text, ainfo_biter_setText, ZEND_ACC_PUBLIC)
  218. PHP_ME_MAPPING(first, breakiter_first, ainfo_biter_void, ZEND_ACC_PUBLIC)
  219. PHP_ME_MAPPING(last, breakiter_last, ainfo_biter_void, ZEND_ACC_PUBLIC)
  220. PHP_ME_MAPPING(previous, breakiter_previous, ainfo_biter_void, ZEND_ACC_PUBLIC)
  221. PHP_ME_MAPPING(next, breakiter_next, ainfo_biter_next, ZEND_ACC_PUBLIC)
  222. PHP_ME_MAPPING(current, breakiter_current, ainfo_biter_void, ZEND_ACC_PUBLIC)
  223. PHP_ME_MAPPING(following, breakiter_following, ainfo_biter_offset, ZEND_ACC_PUBLIC)
  224. PHP_ME_MAPPING(preceding, breakiter_preceding, ainfo_biter_offset, ZEND_ACC_PUBLIC)
  225. PHP_ME_MAPPING(isBoundary, breakiter_is_boundary, ainfo_biter_offset, ZEND_ACC_PUBLIC)
  226. PHP_ME_MAPPING(getLocale, breakiter_get_locale, ainfo_biter_get_locale, ZEND_ACC_PUBLIC)
  227. PHP_ME_MAPPING(getPartsIterator, breakiter_get_parts_iterator, ainfo_biter_getPartsIterator, ZEND_ACC_PUBLIC)
  228. PHP_ME_MAPPING(getErrorCode, breakiter_get_error_code, ainfo_biter_void, ZEND_ACC_PUBLIC)
  229. PHP_ME_MAPPING(getErrorMessage, breakiter_get_error_message, ainfo_biter_void, ZEND_ACC_PUBLIC)
  230. PHP_FE_END
  231. };
  232. /* }}} */
  233. /* {{{ RuleBasedBreakIterator_class_functions
  234. */
  235. static const zend_function_entry RuleBasedBreakIterator_class_functions[] = {
  236. PHP_ME(IntlRuleBasedBreakIterator, __construct, ainfo_rbbi___construct, ZEND_ACC_PUBLIC)
  237. PHP_ME_MAPPING(getRules, rbbi_get_rules, ainfo_biter_void, ZEND_ACC_PUBLIC)
  238. PHP_ME_MAPPING(getRuleStatus, rbbi_get_rule_status, ainfo_biter_void, ZEND_ACC_PUBLIC)
  239. PHP_ME_MAPPING(getRuleStatusVec, rbbi_get_rule_status_vec, ainfo_biter_void, ZEND_ACC_PUBLIC)
  240. #if U_ICU_VERSION_MAJOR_NUM * 10 + U_ICU_VERSION_MINOR_NUM >= 48
  241. PHP_ME_MAPPING(getBinaryRules, rbbi_get_binary_rules, ainfo_biter_void, ZEND_ACC_PUBLIC)
  242. #endif
  243. PHP_FE_END
  244. };
  245. /* }}} */
  246. /* {{{ CodePointBreakIterator_class_functions
  247. */
  248. static const zend_function_entry CodePointBreakIterator_class_functions[] = {
  249. PHP_ME_MAPPING(getLastCodePoint, cpbi_get_last_code_point, ainfo_biter_void, ZEND_ACC_PUBLIC)
  250. PHP_FE_END
  251. };
  252. /* }}} */
  253. /* {{{ breakiterator_register_BreakIterator_class
  254. * Initialize 'BreakIterator' class
  255. */
  256. U_CFUNC void breakiterator_register_BreakIterator_class(void)
  257. {
  258. zend_class_entry ce;
  259. /* Create and register 'BreakIterator' class. */
  260. INIT_CLASS_ENTRY(ce, "IntlBreakIterator", BreakIterator_class_functions);
  261. ce.create_object = BreakIterator_object_create;
  262. ce.get_iterator = _breakiterator_get_iterator;
  263. BreakIterator_ce_ptr = zend_register_internal_class(&ce);
  264. memcpy(&BreakIterator_handlers, &std_object_handlers,
  265. sizeof BreakIterator_handlers);
  266. BreakIterator_handlers.offset = XtOffsetOf(BreakIterator_object, zo);
  267. BreakIterator_handlers.compare_objects = BreakIterator_compare_objects;
  268. BreakIterator_handlers.clone_obj = BreakIterator_clone_obj;
  269. BreakIterator_handlers.get_debug_info = BreakIterator_get_debug_info;
  270. BreakIterator_handlers.free_obj = BreakIterator_objects_free;
  271. zend_class_implements(BreakIterator_ce_ptr, 1,
  272. zend_ce_traversable);
  273. zend_declare_class_constant_long(BreakIterator_ce_ptr,
  274. "DONE", sizeof("DONE") - 1, BreakIterator::DONE );
  275. /* Declare constants that are defined in the C header */
  276. #define BREAKITER_DECL_LONG_CONST(name) \
  277. zend_declare_class_constant_long(BreakIterator_ce_ptr, #name, \
  278. sizeof(#name) - 1, UBRK_ ## name)
  279. BREAKITER_DECL_LONG_CONST(WORD_NONE);
  280. BREAKITER_DECL_LONG_CONST(WORD_NONE_LIMIT);
  281. BREAKITER_DECL_LONG_CONST(WORD_NUMBER);
  282. BREAKITER_DECL_LONG_CONST(WORD_NUMBER_LIMIT);
  283. BREAKITER_DECL_LONG_CONST(WORD_LETTER);
  284. BREAKITER_DECL_LONG_CONST(WORD_LETTER_LIMIT);
  285. BREAKITER_DECL_LONG_CONST(WORD_KANA);
  286. BREAKITER_DECL_LONG_CONST(WORD_KANA_LIMIT);
  287. BREAKITER_DECL_LONG_CONST(WORD_IDEO);
  288. BREAKITER_DECL_LONG_CONST(WORD_IDEO_LIMIT);
  289. BREAKITER_DECL_LONG_CONST(LINE_SOFT);
  290. BREAKITER_DECL_LONG_CONST(LINE_SOFT_LIMIT);
  291. BREAKITER_DECL_LONG_CONST(LINE_HARD);
  292. BREAKITER_DECL_LONG_CONST(LINE_HARD_LIMIT);
  293. BREAKITER_DECL_LONG_CONST(SENTENCE_TERM);
  294. BREAKITER_DECL_LONG_CONST(SENTENCE_TERM_LIMIT);
  295. BREAKITER_DECL_LONG_CONST(SENTENCE_SEP);
  296. BREAKITER_DECL_LONG_CONST(SENTENCE_SEP_LIMIT);
  297. #undef BREAKITER_DECL_LONG_CONST
  298. /* Create and register 'RuleBasedBreakIterator' class. */
  299. INIT_CLASS_ENTRY(ce, "IntlRuleBasedBreakIterator",
  300. RuleBasedBreakIterator_class_functions);
  301. RuleBasedBreakIterator_ce_ptr = zend_register_internal_class_ex(&ce,
  302. BreakIterator_ce_ptr);
  303. /* Create and register 'CodePointBreakIterator' class. */
  304. INIT_CLASS_ENTRY(ce, "IntlCodePointBreakIterator",
  305. CodePointBreakIterator_class_functions);
  306. CodePointBreakIterator_ce_ptr = zend_register_internal_class_ex(&ce,
  307. BreakIterator_ce_ptr);
  308. }
  309. /* }}} */