/*
*****************************************************************************************
* Copyright (C) 2014, International Business Machines
* Corporation and others. All Rights Reserved.
*****************************************************************************************
*/
  7. #ifndef UREGION_H
  8. #define UREGION_H
  9. #include "unicode/utypes.h"
  10. #include "unicode/uenum.h"
/**
 * \file
 * \brief C API: URegion (territory containment and mapping)
 *
 * URegion objects represent data associated with a particular Unicode Region Code, also known as a
 * Unicode Region Subtag, which is defined based upon the BCP 47 standard. These include:
 * * Two-letter codes defined by ISO 3166-1, with special LDML treatment of certain private-use or
 *   reserved codes;
 * * A subset of 3-digit numeric codes defined by UN M.49.
 *
 * URegion objects can also provide mappings to and from additional codes. There are different types
 * of regions that are important to distinguish:
 * <p>
 * Macroregion - A code for a "macro geographical (continental) region, geographical sub-region, or
 * selected economic and other grouping" as defined in UN M.49. These are typically 3-digit codes,
 * but contain some 2-letter codes for LDML extensions, such as "QO" for Outlying Oceania.
 * Macroregions are represented in ICU by one of three region types: WORLD (code 001),
 * CONTINENTS (regions contained directly by WORLD), and SUBCONTINENTS (regions contained directly
 * by a continent).
 * <p>
 * TERRITORY - A Region that is not a Macroregion. These are typically codes for countries, but also
 * include areas that are not separate countries, such as the code "AQ" for Antarctica or the code
 * "HK" for Hong Kong (SAR China). Overseas dependencies of countries may or may not have separate
 * codes. The codes are typically 2-letter codes aligned with ISO 3166, but BCP 47 allows for the use
 * of 3-digit codes in the future.
 * <p>
 * UNKNOWN - The code ZZ is defined by Unicode LDML for use in indicating that the region is unknown,
 * or that the value supplied as a region was invalid.
 * <p>
 * DEPRECATED - Region codes that have been defined in the past but are no longer in modern usage,
 * usually due to a country splitting into multiple territories or changing its name.
 * <p>
 * GROUPING - A widely understood grouping of territories that has a well defined membership such
 * that a region code has been assigned for it. Some of these are UN M.49 codes that don't fall into
 * the world/continent/sub-continent hierarchy, while others are just well-known groupings that have
 * their own region code. Region "EU" (European Union) is one such region code that is a grouping.
 * Groupings will never be returned by uregion_getContainingRegion, since a different type of region
 * (WORLD, CONTINENT, or SUBCONTINENT) will always be the containing region instead.
 *
 * URegion objects are const/immutable, owned and maintained by ICU itself, so there are no functions
 * to open or close them.
 */
  52. /**
  53. * URegionType is an enumeration defining the different types of regions. Current possible
  54. * values are URGN_WORLD, URGN_CONTINENT, URGN_SUBCONTINENT, URGN_TERRITORY, URGN_GROUPING,
  55. * URGN_DEPRECATED, and URGN_UNKNOWN.
  56. *
  57. * @stable ICU 51
  58. */
  59. typedef enum URegionType {
  60. /**
  61. * Type representing the unknown region.
  62. * @stable ICU 51
  63. */
  64. URGN_UNKNOWN,
  65. /**
  66. * Type representing a territory.
  67. * @stable ICU 51
  68. */
  69. URGN_TERRITORY,
  70. /**
  71. * Type representing the whole world.
  72. * @stable ICU 51
  73. */
  74. URGN_WORLD,
  75. /**
  76. * Type representing a continent.
  77. * @stable ICU 51
  78. */
  79. URGN_CONTINENT,
  80. /**
  81. * Type representing a sub-continent.
  82. * @stable ICU 51
  83. */
  84. URGN_SUBCONTINENT,
  85. /**
  86. * Type representing a grouping of territories that is not to be used in
  87. * the normal WORLD/CONTINENT/SUBCONTINENT/TERRITORY containment tree.
  88. * @stable ICU 51
  89. */
  90. URGN_GROUPING,
  91. /**
  92. * Type representing a region whose code has been deprecated, usually
  93. * due to a country splitting into multiple territories or changing its name.
  94. * @stable ICU 51
  95. */
  96. URGN_DEPRECATED,
  97. /**
  98. * Maximum value for this unumeration.
  99. * @stable ICU 51
  100. */
  101. URGN_LIMIT
  102. } URegionType;
  103. #if !UCONFIG_NO_FORMATTING
  104. /**
  105. * Opaque URegion object for use in C programs.
  106. * @stable ICU 52
  107. */
  108. struct URegion;
  109. typedef struct URegion URegion; /**< @stable ICU 52 */
  110. /**
  111. * Returns a pointer to a URegion for the specified region code: A 2-letter or 3-letter ISO 3166
  112. * code, UN M.49 numeric code (superset of ISO 3166 numeric codes), or other valid Unicode Region
  113. * Code as defined by the LDML specification. The code will be canonicalized internally. If the
  114. * region code is NULL or not recognized, the appropriate error code will be set
  115. * (U_ILLEGAL_ARGUMENT_ERROR).
  116. * @stable ICU 52
  117. */
  118. U_STABLE const URegion* U_EXPORT2
  119. uregion_getRegionFromCode(const char *regionCode, UErrorCode *status);
  120. /**
  121. * Returns a pointer to a URegion for the specified numeric region code. If the numeric region
  122. * code is not recognized, the appropriate error code will be set (U_ILLEGAL_ARGUMENT_ERROR).
  123. * @stable ICU 52
  124. */
  125. U_STABLE const URegion* U_EXPORT2
  126. uregion_getRegionFromNumericCode (int32_t code, UErrorCode *status);
  127. /**
  128. * Returns an enumeration over the canonical codes of all known regions that match the given type.
  129. * The enumeration must be closed with with uenum_close().
  130. * @stable ICU 52
  131. */
  132. U_STABLE UEnumeration* U_EXPORT2
  133. uregion_getAvailable(URegionType type, UErrorCode *status);
  134. /**
  135. * Returns true if the specified uregion is equal to the specified otherRegion.
  136. * @stable ICU 52
  137. */
  138. U_STABLE UBool U_EXPORT2
  139. uregion_areEqual(const URegion* uregion, const URegion* otherRegion);
  140. /**
  141. * Returns a pointer to the URegion that contains the specified uregion. Returns NULL if the
  142. * specified uregion is code "001" (World) or "ZZ" (Unknown region). For example, calling
  143. * this method with region "IT" (Italy) returns the URegion for "039" (Southern Europe).
  144. * @stable ICU 52
  145. */
  146. U_STABLE const URegion* U_EXPORT2
  147. uregion_getContainingRegion(const URegion* uregion);
  148. /**
  149. * Return a pointer to the URegion that geographically contains this uregion and matches the
  150. * specified type, moving multiple steps up the containment chain if necessary. Returns NULL if no
  151. * containing region can be found that matches the specified type. Will return NULL if URegionType
  152. * is URGN_GROUPING, URGN_DEPRECATED, or URGN_UNKNOWN which are not appropriate for this API.
  153. * For example, calling this method with uregion "IT" (Italy) for type URGN_CONTINENT returns the
  154. * URegion "150" (Europe).
  155. * @stable ICU 52
  156. */
  157. U_STABLE const URegion* U_EXPORT2
  158. uregion_getContainingRegionOfType(const URegion* uregion, URegionType type);
  159. /**
  160. * Return an enumeration over the canonical codes of all the regions that are immediate children
  161. * of the specified uregion in the region hierarchy. These returned regions could be either macro
  162. * regions, territories, or a mixture of the two, depending on the containment data as defined in
  163. * CLDR. This API returns NULL if this uregion doesn't have any sub-regions. For example, calling
  164. * this function for uregion "150" (Europe) returns an enumeration containing the various
  165. * sub-regions of Europe: "039" (Southern Europe), "151" (Eastern Europe), "154" (Northern Europe),
  166. * and "155" (Western Europe). The enumeration must be closed with with uenum_close().
  167. * @stable ICU 52
  168. */
  169. U_STABLE UEnumeration* U_EXPORT2
  170. uregion_getContainedRegions(const URegion* uregion, UErrorCode *status);
  171. /**
  172. * Returns an enumeration over the canonical codes of all the regions that are children of the
  173. * specified uregion anywhere in the region hierarchy and match the given type. This API may return
  174. * an empty enumeration if this uregion doesn't have any sub-regions that match the given type.
  175. * For example, calling this method with region "150" (Europe) and type URGN_TERRITORY" returns an
  176. * enumeration containing all the territories in Europe: "FR" (France), "IT" (Italy), "DE" (Germany),
  177. * etc. The enumeration must be closed with with uenum_close().
  178. * @stable ICU 52
  179. */
  180. U_STABLE UEnumeration* U_EXPORT2
  181. uregion_getContainedRegionsOfType(const URegion* uregion, URegionType type, UErrorCode *status);
  182. /**
  183. * Returns true if the specified uregion contains the specified otherRegion anywhere in the region
  184. * hierarchy.
  185. * @stable ICU 52
  186. */
  187. U_STABLE UBool U_EXPORT2
  188. uregion_contains(const URegion* uregion, const URegion* otherRegion);
  189. /**
  190. * If the specified uregion is deprecated, returns an enumeration over the canonical codes of the
  191. * regions that are the preferred replacement regions for the specified uregion. If the specified
  192. * uregion is not deprecated, returns NULL. For example, calling this method with uregion
  193. * "SU" (Soviet Union) returns a list of the regions containing "RU" (Russia), "AM" (Armenia),
  194. * "AZ" (Azerbaijan), etc... The enumeration must be closed with with uenum_close().
  195. * @stable ICU 52
  196. */
  197. U_STABLE UEnumeration* U_EXPORT2
  198. uregion_getPreferredValues(const URegion* uregion, UErrorCode *status);
  199. /**
  200. * Returns the specified uregion's canonical code.
  201. * @stable ICU 52
  202. */
  203. U_STABLE const char* U_EXPORT2
  204. uregion_getRegionCode(const URegion* uregion);
  205. /**
  206. * Returns the specified uregion's numeric code, or a negative value if there is no numeric code
  207. * for the specified uregion.
  208. * @stable ICU 52
  209. */
  210. U_STABLE int32_t U_EXPORT2
  211. uregion_getNumericCode(const URegion* uregion);
  212. /**
  213. * Returns the URegionType of the specified uregion.
  214. * @stable ICU 52
  215. */
  216. U_STABLE URegionType U_EXPORT2
  217. uregion_getType(const URegion* uregion);
  218. #endif /* #if !UCONFIG_NO_FORMATTING */
  219. #endif