stringpiece.h 6.4 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224
  1. // Copyright (C) 2009-2013, International Business Machines
  2. // Corporation and others. All Rights Reserved.
  3. //
  4. // Copyright 2001 and onwards Google Inc.
  5. // Author: Sanjay Ghemawat
  6. // This code is a contribution of Google code, and the style used here is
  7. // a compromise between the original Google code and the ICU coding guidelines.
  8. // For example, data types are ICU-ified (size_t,int->int32_t),
  9. // and API comments doxygen-ified, but function names and behavior are
  10. // as in the original, if possible.
  11. // Assertion-style error handling, not available in ICU, was changed to
  12. // parameter "pinning" similar to UnicodeString.
  13. //
  14. // In addition, this is only a partial port of the original Google code,
  15. // limited to what was needed so far. The (nearly) complete original code
  16. // is in the ICU svn repository at icuhtml/trunk/design/strings/contrib
  17. // (see ICU ticket 6765, r25517).
  18. #ifndef __STRINGPIECE_H__
  19. #define __STRINGPIECE_H__
  20. /**
  21. * \file
  22. * \brief C++ API: StringPiece: Read-only byte string wrapper class.
  23. */
  24. #include "unicode/utypes.h"
  25. #include "unicode/uobject.h"
  26. #include "unicode/std_string.h"
  27. // Arghh! I wish C++ literals were "string".
  28. U_NAMESPACE_BEGIN
  29. /**
  30. * A string-like object that points to a sized piece of memory.
  31. *
  32. * We provide non-explicit singleton constructors so users can pass
  33. * in a "const char*" or a "string" wherever a "StringPiece" is
  34. * expected.
  35. *
  36. * Functions or methods may use const StringPiece& parameters to accept either
  37. * a "const char*" or a "string" value that will be implicitly converted to
  38. * a StringPiece.
  39. *
  40. * Systematic usage of StringPiece is encouraged as it will reduce unnecessary
  41. * conversions from "const char*" to "string" and back again.
  42. *
  43. * @stable ICU 4.2
  44. */
  45. class U_COMMON_API StringPiece : public UMemory {
  46. private:
  47. const char* ptr_;
  48. int32_t length_;
  49. public:
  50. /**
  51. * Default constructor, creates an empty StringPiece.
  52. * @stable ICU 4.2
  53. */
  54. StringPiece() : ptr_(NULL), length_(0) { }
  55. /**
  56. * Constructs from a NUL-terminated const char * pointer.
  57. * @param str a NUL-terminated const char * pointer
  58. * @stable ICU 4.2
  59. */
  60. StringPiece(const char* str);
  61. #if U_HAVE_STD_STRING
  62. /**
  63. * Constructs from a std::string.
  64. * @stable ICU 4.2
  65. */
  66. StringPiece(const std::string& str)
  67. : ptr_(str.data()), length_(static_cast<int32_t>(str.size())) { }
  68. #endif
  69. /**
  70. * Constructs from a const char * pointer and a specified length.
  71. * @param offset a const char * pointer (need not be terminated)
  72. * @param len the length of the string; must be non-negative
  73. * @stable ICU 4.2
  74. */
  75. StringPiece(const char* offset, int32_t len) : ptr_(offset), length_(len) { }
  76. /**
  77. * Substring of another StringPiece.
  78. * @param x the other StringPiece
  79. * @param pos start position in x; must be non-negative and <= x.length().
  80. * @stable ICU 4.2
  81. */
  82. StringPiece(const StringPiece& x, int32_t pos);
  83. /**
  84. * Substring of another StringPiece.
  85. * @param x the other StringPiece
  86. * @param pos start position in x; must be non-negative and <= x.length().
  87. * @param len length of the substring;
  88. * must be non-negative and will be pinned to at most x.length() - pos.
  89. * @stable ICU 4.2
  90. */
  91. StringPiece(const StringPiece& x, int32_t pos, int32_t len);
  92. /**
  93. * Returns the string pointer. May be NULL if it is empty.
  94. *
  95. * data() may return a pointer to a buffer with embedded NULs, and the
  96. * returned buffer may or may not be null terminated. Therefore it is
  97. * typically a mistake to pass data() to a routine that expects a NUL
  98. * terminated string.
  99. * @return the string pointer
  100. * @stable ICU 4.2
  101. */
  102. const char* data() const { return ptr_; }
  103. /**
  104. * Returns the string length. Same as length().
  105. * @return the string length
  106. * @stable ICU 4.2
  107. */
  108. int32_t size() const { return length_; }
  109. /**
  110. * Returns the string length. Same as size().
  111. * @return the string length
  112. * @stable ICU 4.2
  113. */
  114. int32_t length() const { return length_; }
  115. /**
  116. * Returns whether the string is empty.
  117. * @return TRUE if the string is empty
  118. * @stable ICU 4.2
  119. */
  120. UBool empty() const { return length_ == 0; }
  121. /**
  122. * Sets to an empty string.
  123. * @stable ICU 4.2
  124. */
  125. void clear() { ptr_ = NULL; length_ = 0; }
  126. /**
  127. * Reset the stringpiece to refer to new data.
  128. * @param xdata pointer the new string data. Need not be nul terminated.
  129. * @param len the length of the new data
  130. * @stable ICU 4.8
  131. */
  132. void set(const char* xdata, int32_t len) { ptr_ = xdata; length_ = len; }
  133. /**
  134. * Reset the stringpiece to refer to new data.
  135. * @param str a pointer to a NUL-terminated string.
  136. * @stable ICU 4.8
  137. */
  138. void set(const char* str);
  139. /**
  140. * Removes the first n string units.
  141. * @param n prefix length, must be non-negative and <=length()
  142. * @stable ICU 4.2
  143. */
  144. void remove_prefix(int32_t n) {
  145. if (n >= 0) {
  146. if (n > length_) {
  147. n = length_;
  148. }
  149. ptr_ += n;
  150. length_ -= n;
  151. }
  152. }
  153. /**
  154. * Removes the last n string units.
  155. * @param n suffix length, must be non-negative and <=length()
  156. * @stable ICU 4.2
  157. */
  158. void remove_suffix(int32_t n) {
  159. if (n >= 0) {
  160. if (n <= length_) {
  161. length_ -= n;
  162. } else {
  163. length_ = 0;
  164. }
  165. }
  166. }
  167. /**
  168. * Maximum integer, used as a default value for substring methods.
  169. * @stable ICU 4.2
  170. */
  171. static const int32_t npos; // = 0x7fffffff;
  172. /**
  173. * Returns a substring of this StringPiece.
  174. * @param pos start position; must be non-negative and <= length().
  175. * @param len length of the substring;
  176. * must be non-negative and will be pinned to at most length() - pos.
  177. * @return the substring StringPiece
  178. * @stable ICU 4.2
  179. */
  180. StringPiece substr(int32_t pos, int32_t len = npos) const {
  181. return StringPiece(*this, pos, len);
  182. }
  183. };
  184. /**
  185. * Global operator == for StringPiece
  186. * @param x The first StringPiece to compare.
  187. * @param y The second StringPiece to compare.
  188. * @return TRUE if the string data is equal
  189. * @stable ICU 4.8
  190. */
  191. U_EXPORT UBool U_EXPORT2
  192. operator==(const StringPiece& x, const StringPiece& y);
  193. /**
  194. * Global operator != for StringPiece
  195. * @param x The first StringPiece to compare.
  196. * @param y The second StringPiece to compare.
  197. * @return TRUE if the string data is not equal
  198. * @stable ICU 4.8
  199. */
  200. inline UBool operator!=(const StringPiece& x, const StringPiece& y) {
  201. return !(x == y);
  202. }
  203. U_NAMESPACE_END
  204. #endif // __STRINGPIECE_H__