intl_convert.c 4.9 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157
  1. /*
  2. +----------------------------------------------------------------------+
  3. | PHP Version 5 |
  4. +----------------------------------------------------------------------+
  5. | This source file is subject to version 3.01 of the PHP license, |
  6. | that is bundled with this package in the file LICENSE, and is |
  7. | available through the world-wide-web at the following url: |
  8. | http://www.php.net/license/3_01.txt |
  9. | If you did not receive a copy of the PHP license and are unable to |
  10. | obtain it through the world-wide-web, please send a note to |
  11. | license@php.net so we can mail you a copy immediately. |
  12. +----------------------------------------------------------------------+
  13. | Authors: Vadim Savchuk <vsavchuk@productengine.com> |
  14. | Dmitry Lakhtyuk <dlakhtyuk@productengine.com> |
  15. +----------------------------------------------------------------------+
  16. */
  17. #ifdef HAVE_CONFIG_H
  18. #include "config.h"
  19. #endif
  20. #include <php.h>
  21. #include "intl_common.h"
  22. #include "intl_convert.h"
  23. /* {{{ intl_convert_utf8_to_utf16
  24. * Convert given string from UTF-8 to UTF-16 to *target buffer.
  25. *
  26. * It *target is NULL then we allocate a large enough buffer,
  27. * store the converted string into it, and make target point to it.
  28. *
  29. * Otherwise, if *target is non-NULL, we assume that it points to a
  30. * dynamically allocated buffer of *target_len bytes length.
  31. * In this case the buffer will be used to store the converted string to,
  32. * and may be resized (made larger) if needed.
  33. *
  34. * @param target Where to place the result.
  35. * @param target_len Result length.
  36. * @param source String to convert.
  37. * @param source_len Length of the source string.
  38. * @param status Conversion status.
  39. *
  40. * @return void This function does not return anything.
  41. */
  42. void intl_convert_utf8_to_utf16(
  43. UChar** target, int* target_len,
  44. const char* src, int src_len,
  45. UErrorCode* status )
  46. {
  47. UChar* dst_buf = NULL;
  48. uint32_t dst_len = 0;
  49. /* If *target is NULL determine required destination buffer size (pre-flighting).
  50. * Otherwise, attempt to convert source string; if *target buffer is not large enough
  51. * it will be resized appropriately.
  52. */
  53. *status = U_ZERO_ERROR;
  54. u_strFromUTF8( *target, *target_len, &dst_len, src, src_len, status );
  55. if( *status == U_ZERO_ERROR )
  56. {
  57. /* String is converted successfuly */
  58. (*target)[dst_len] = 0;
  59. *target_len = dst_len;
  60. return;
  61. }
  62. /* Bail out if an unexpected error occurred.
  63. * (U_BUFFER_OVERFLOW_ERROR means that *target buffer is not large enough).
  64. * (U_STRING_NOT_TERMINATED_WARNING usually means that the input string is empty).
  65. */
  66. if( *status != U_BUFFER_OVERFLOW_ERROR && *status != U_STRING_NOT_TERMINATED_WARNING )
  67. return;
  68. /* Allocate memory for the destination buffer (it will be zero-terminated). */
  69. dst_buf = eumalloc( dst_len + 1 );
  70. /* Convert source string from UTF-8 to UTF-16. */
  71. *status = U_ZERO_ERROR;
  72. u_strFromUTF8( dst_buf, dst_len+1, NULL, src, src_len, status );
  73. if( U_FAILURE( *status ) )
  74. {
  75. efree( dst_buf );
  76. return;
  77. }
  78. dst_buf[dst_len] = 0;
  79. if( *target )
  80. efree( *target );
  81. *target = dst_buf;
  82. *target_len = dst_len;
  83. }
  84. /* }}} */
  85. /* {{{ intl_convert_utf16_to_utf8
  86. * Convert given string from UTF-16 to UTF-8.
  87. *
  88. * @param target Where to place the result.
  89. * @param target_len Result length.
  90. * @param source String to convert.
  91. * @param source_len Length of the source string.
  92. * @param status Conversion status.
  93. *
  94. * @return void This function does not return anything.
  95. */
  96. void intl_convert_utf16_to_utf8(
  97. char** target, int* target_len,
  98. const UChar* src, int src_len,
  99. UErrorCode* status )
  100. {
  101. char* dst_buf = NULL;
  102. int32_t dst_len;
  103. /* Determine required destination buffer size (pre-flighting). */
  104. *status = U_ZERO_ERROR;
  105. u_strToUTF8( NULL, 0, &dst_len, src, src_len, status );
  106. /* Bail out if an unexpected error occurred.
  107. * (U_BUFFER_OVERFLOW_ERROR means that *target buffer is not large enough).
  108. * (U_STRING_NOT_TERMINATED_WARNING usually means that the input string is empty).
  109. */
  110. if( *status != U_BUFFER_OVERFLOW_ERROR && *status != U_STRING_NOT_TERMINATED_WARNING )
  111. return;
  112. /* Allocate memory for the destination buffer (it will be zero-terminated). */
  113. dst_buf = emalloc( dst_len+1 );
  114. /* Convert source string from UTF-8 to UTF-16. */
  115. *status = U_ZERO_ERROR;
  116. u_strToUTF8( dst_buf, dst_len, NULL, src, src_len, status );
  117. if( U_FAILURE( *status ) )
  118. {
  119. efree( dst_buf );
  120. return;
  121. }
  122. /* U_STRING_NOT_TERMINATED_WARNING is OK for us => reset 'status'. */
  123. *status = U_ZERO_ERROR;
  124. dst_buf[dst_len] = 0;
  125. *target = dst_buf;
  126. *target_len = dst_len;
  127. }
  128. /* }}} */
  129. /*
  130. * Local variables:
  131. * tab-width: 4
  132. * c-basic-offset: 4
  133. * End:
  134. * vim600: noet sw=4 ts=4 fdm=marker
  135. * vim<600: noet sw=4 ts=4
  136. */