region.h 9.0 KB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222
  1. /*
  2. *******************************************************************************
  3. * Copyright (C) 2014-2016, International Business Machines Corporation and others.
  4. * All Rights Reserved.
  5. *******************************************************************************
  6. */
  7. #ifndef REGION_H
  8. #define REGION_H
  9. /**
  10. * \file
  11. * \brief C++ API: Region classes (territory containment)
  12. */
  13. #include "unicode/utypes.h"
  14. #include "unicode/uregion.h"
  15. #if !UCONFIG_NO_FORMATTING
  16. #include "unicode/uobject.h"
  17. #include "unicode/uniset.h"
  18. #include "unicode/unistr.h"
  19. #include "unicode/strenum.h"
  20. U_NAMESPACE_BEGIN
  21. /**
  22. * <code>Region</code> is the class representing a Unicode Region Code, also known as a
  23. * Unicode Region Subtag, which is defined based upon the BCP 47 standard. We often think of
  24. * "regions" as "countries" when defining the characteristics of a locale. There are different
  25. * types of region codes that are important to distinguish.
  26. * <p>
  27. * Macroregion - A code for a "macro geographical (continental) region, geographical sub-region, or
  28. * selected economic and other grouping" as defined in
  29. * UN M.49 (http://unstats.un.org/unsd/methods/m49/m49regin.htm).
  30. * These are typically 3-digit codes, but contain some 2-letter codes, such as the LDML code QO
  31. * added for Outlying Oceania. Not all UN M.49 codes are defined in LDML, but most of them are.
  32. * Macroregions are represented in ICU by one of three region types: WORLD ( region code 001 ),
  33. * CONTINENTS ( regions contained directly by WORLD ), and SUBCONTINENTS ( things contained directly
  34. * by a continent ).
  35. * <p>
  36. * TERRITORY - A Region that is not a Macroregion. These are typically codes for countries, but also
  37. * include areas that are not separate countries, such as the code "AQ" for Antarctica or the code
  38. * "HK" for Hong Kong (SAR China). Overseas dependencies of countries may or may not have separate
  39. * codes. The codes are typically 2-letter codes aligned with the ISO 3166 standard, but BCP47 allows
  40. * for the use of 3-digit codes in the future.
  41. * <p>
  42. * UNKNOWN - The code ZZ is defined by Unicode LDML for use to indicate that the Region is unknown,
  43. * or that the value supplied as a region was invalid.
  44. * <p>
  45. * DEPRECATED - Region codes that have been defined in the past but are no longer in modern usage,
  46. * usually due to a country splitting into multiple territories or changing its name.
  47. * <p>
  48. * GROUPING - A widely understood grouping of territories that has a well defined membership such
  49. * that a region code has been assigned for it. Some of these are UN M.49 codes that don't fall into
  50. * the world/continent/sub-continent hierarchy, while others are just well known groupings that have
  51. * their own region code. Region "EU" (European Union) is one such region code that is a grouping.
  52. * Groupings will never be returned by the getContainingRegion() API, since a different type of region
  53. * ( WORLD, CONTINENT, or SUBCONTINENT ) will always be the containing region instead.
  54. *
  55. * The Region class is not intended for public subclassing.
  56. *
  57. * @author John Emmons
  58. * @stable ICU 51
  59. */
  60. class U_I18N_API Region : public UObject {
  61. public:
  62. /**
  63. * Destructor.
  64. * @stable ICU 51
  65. */
  66. virtual ~Region();
  67. /**
  68. * Returns true if the two regions are equal.
  69. * @stable ICU 51
  70. */
  71. UBool operator==(const Region &that) const;
  72. /**
  73. * Returns true if the two regions are NOT equal; that is, if operator ==() returns false.
  74. * @stable ICU 51
  75. */
  76. UBool operator!=(const Region &that) const;
  77. /**
  78. * Returns a pointer to a Region using the given region code. The region code can be either 2-letter ISO code,
  79. * 3-letter ISO code, UN M.49 numeric code, or other valid Unicode Region Code as defined by the LDML specification.
  80. * The identifier will be canonicalized internally using the supplemental metadata as defined in the CLDR.
  81. * If the region code is NULL or not recognized, the appropriate error code will be set ( U_ILLEGAL_ARGUMENT_ERROR ).
  82. * @stable ICU 51
  83. */
  84. static const Region* U_EXPORT2 getInstance(const char *region_code, UErrorCode &status);
  85. /**
  86. * Returns a pointer to a Region using the given numeric region code. If the numeric region code is not recognized,
  87. * the appropriate error code will be set ( U_ILLEGAL_ARGUMENT_ERROR ).
  88. * @stable ICU 51
  89. */
  90. static const Region* U_EXPORT2 getInstance (int32_t code, UErrorCode &status);
  91. /**
  92. * Returns an enumeration over the IDs of all known regions that match the given type.
  93. * @stable ICU 55
  94. */
  95. static StringEnumeration* U_EXPORT2 getAvailable(URegionType type, UErrorCode &status);
  96. /**
  97. * Returns a pointer to the region that contains this region. Returns NULL if this region is code "001" (World)
  98. * or "ZZ" (Unknown region). For example, calling this method with region "IT" (Italy) returns the
  99. * region "039" (Southern Europe).
  100. * @stable ICU 51
  101. */
  102. const Region* getContainingRegion() const;
  103. /**
  104. * Return a pointer to the region that geographically contains this region and matches the given type,
  105. * moving multiple steps up the containment chain if necessary. Returns NULL if no containing region can be found
  106. * that matches the given type. Note: The URegionTypes = "URGN_GROUPING", "URGN_DEPRECATED", or "URGN_UNKNOWN"
  107. * are not appropriate for use in this API. NULL will be returned in this case. For example, calling this method
  108. * with region "IT" (Italy) for type "URGN_CONTINENT" returns the region "150" ( Europe ).
  109. * @stable ICU 51
  110. */
  111. const Region* getContainingRegion(URegionType type) const;
  112. /**
  113. * Return an enumeration over the IDs of all the regions that are immediate children of this region in the
  114. * region hierarchy. These returned regions could be either macro regions, territories, or a mixture of the two,
  115. * depending on the containment data as defined in CLDR. This API may return NULL if this region doesn't have
  116. * any sub-regions. For example, calling this method with region "150" (Europe) returns an enumeration containing
  117. * the various sub regions of Europe - "039" (Southern Europe) - "151" (Eastern Europe) - "154" (Northern Europe)
  118. * and "155" (Western Europe).
  119. * @stable ICU 55
  120. */
  121. StringEnumeration* getContainedRegions(UErrorCode &status) const;
  122. /**
  123. * Returns an enumeration over the IDs of all the regions that are children of this region anywhere in the region
  124. * hierarchy and match the given type. This API may return an empty enumeration if this region doesn't have any
  125. * sub-regions that match the given type. For example, calling this method with region "150" (Europe) and type
  126. * "URGN_TERRITORY" returns an enumeration containing all the territories in Europe ( "FR" (France) - "IT" (Italy) - "DE" (Germany) etc. )
  127. * @stable ICU 55
  128. */
  129. StringEnumeration* getContainedRegions( URegionType type, UErrorCode &status ) const;
  130. /**
  131. * Returns true if this region contains the supplied other region anywhere in the region hierarchy.
  132. * @stable ICU 51
  133. */
  134. UBool contains(const Region &other) const;
  135. /**
  136. * For deprecated regions, return an enumeration over the IDs of the regions that are the preferred replacement
  137. * regions for this region. Returns NULL for a non-deprecated region. For example, calling this method with region
  138. * "SU" (Soviet Union) would return a list of the regions containing "RU" (Russia), "AM" (Armenia), "AZ" (Azerbaijan), etc...
  139. * @stable ICU 55
  140. */
  141. StringEnumeration* getPreferredValues(UErrorCode &status) const;
  142. /**
  143. * Return this region's canonical region code.
  144. * @stable ICU 51
  145. */
  146. const char* getRegionCode() const;
  147. /**
  148. * Return this region's numeric code.
  149. * Returns a negative value if this region does not have a numeric code assigned to it.
  150. * @stable ICU 51
  151. */
  152. int32_t getNumericCode() const;
  153. /**
  154. * Returns the region type of this region.
  155. * @stable ICU 51
  156. */
  157. URegionType getType() const;
  158. #ifndef U_HIDE_INTERNAL_API
  159. /**
  160. * Cleans up statically allocated memory.
  161. * @internal
  162. */
  163. static void cleanupRegionData();
  164. #endif /* U_HIDE_INTERNAL_API */
  165. private:
  166. char id[4]; // NOTE(review): presumably backs getRegionCode() (3 chars + NUL) - confirm in the implementation
  167. UnicodeString idStr; // NOTE(review): presumably the same code held as a UnicodeString - confirm
  168. int32_t code; // NOTE(review): presumably the value returned by getNumericCode() - confirm
  169. URegionType type; // NOTE(review): presumably the value returned by getType() - confirm
  170. Region *containingRegion; // NOTE(review): presumably the immediate parent in the containment hierarchy - confirm
  171. UVector *containedRegions; // NOTE(review): presumably the immediate children; ownership not visible here - confirm
  172. UVector *preferredValues; // NOTE(review): presumably the replacements for a deprecated region - confirm
  173. /**
  174. * Default Constructor. Internal - use factory methods only.
  175. */
  176. Region();
  177. /*
  178. * Initializes the region data from the ICU resource bundles. The region data
  179. * contains the basic relationships such as which regions are known, what the numeric
  180. * codes are, any known aliases, and the territory containment data.
  181. *
  182. * If the region data has already been loaded, then this method simply returns without doing
  183. * anything meaningful.
  184. */
  185. static void loadRegionData(UErrorCode &status);
  186. };
  187. U_NAMESPACE_END
  188. #endif /* #if !UCONFIG_NO_FORMATTING */
  189. #endif // REGION_H
  190. //eof