| 1 | // © 2016 and later: Unicode, Inc. and others. |
| 2 | // License & terms of use: http://www.unicode.org/copyright.html |
| 3 | /* |
| 4 | ******************************************************************************* |
| 5 | * Copyright (C) 2014-2016, International Business Machines Corporation and others. |
| 6 | * All Rights Reserved. |
| 7 | ******************************************************************************* |
| 8 | */ |
| 9 | |
| 10 | #ifndef REGION_H |
| 11 | #define REGION_H |
| 12 | |
| 13 | /** |
| 14 | * \file |
| 15 | * \brief C++ API: Region classes (territory containment) |
| 16 | */ |
| 17 | |
| 18 | #include "unicode/utypes.h" |
| 19 | |
| 20 | #if U_SHOW_CPLUSPLUS_API |
| 21 | |
| 22 | #if !UCONFIG_NO_FORMATTING |
| 23 | |
| 24 | #include "unicode/uregion.h" |
| 25 | #include "unicode/uobject.h" |
| 26 | #include "unicode/uniset.h" |
| 27 | #include "unicode/unistr.h" |
| 28 | #include "unicode/strenum.h" |
| 29 | |
| 30 | U_NAMESPACE_BEGIN |
| 31 | |
| 32 | /** |
| 33 | * <code>Region</code> is the class representing a Unicode Region Code, also known as a |
| 34 | * Unicode Region Subtag, which is defined based upon the BCP 47 standard. We often think of |
| 35 | * "regions" as "countries" when defining the characteristics of a locale. Region codes There are different |
| 36 | * types of region codes that are important to distinguish. |
| 37 | * <p> |
| 38 | * Macroregion - A code for a "macro geographical (continental) region, geographical sub-region, or |
| 39 | * selected economic and other grouping" as defined in |
| 40 | * UN M.49 (http://unstats.un.org/unsd/methods/m49/m49regin.htm). |
| 41 | * These are typically 3-digit codes, but contain some 2-letter codes, such as the LDML code QO |
| 42 | * added for Outlying Oceania. Not all UNM.49 codes are defined in LDML, but most of them are. |
| 43 | * Macroregions are represented in ICU by one of three region types: WORLD ( region code 001 ), |
| 44 | * CONTINENTS ( regions contained directly by WORLD ), and SUBCONTINENTS ( things contained directly |
| 45 | * by a continent ). |
| 46 | * <p> |
| 47 | * TERRITORY - A Region that is not a Macroregion. These are typically codes for countries, but also |
| 48 | * include areas that are not separate countries, such as the code "AQ" for Antarctica or the code |
| 49 | * "HK" for Hong Kong (SAR China). Overseas dependencies of countries may or may not have separate |
| 50 | * codes. The codes are typically 2-letter codes aligned with the ISO 3166 standard, but BCP47 allows |
| 51 | * for the use of 3-digit codes in the future. |
| 52 | * <p> |
| 53 | * UNKNOWN - The code ZZ is defined by Unicode LDML for use to indicate that the Region is unknown, |
| 54 | * or that the value supplied as a region was invalid. |
| 55 | * <p> |
| 56 | * DEPRECATED - Region codes that have been defined in the past but are no longer in modern usage, |
| 57 | * usually due to a country splitting into multiple territories or changing its name. |
| 58 | * <p> |
| 59 | * GROUPING - A widely understood grouping of territories that has a well defined membership such |
| 60 | * that a region code has been assigned for it. Some of these are UNM.49 codes that do't fall into |
| 61 | * the world/continent/sub-continent hierarchy, while others are just well known groupings that have |
| 62 | * their own region code. Region "EU" (European Union) is one such region code that is a grouping. |
| 63 | * Groupings will never be returned by the getContainingRegion() API, since a different type of region |
| 64 | * ( WORLD, CONTINENT, or SUBCONTINENT ) will always be the containing region instead. |
| 65 | * |
| 66 | * The Region class is not intended for public subclassing. |
| 67 | * |
| 68 | * @author John Emmons |
| 69 | * @stable ICU 51 |
| 70 | */ |
| 71 | |
| 72 | class U_I18N_API Region : public UObject { |
| 73 | public: |
| 74 | /** |
| 75 | * Destructor. |
| 76 | * @stable ICU 51 |
| 77 | */ |
| 78 | virtual ~Region(); |
| 79 | |
| 80 | /** |
| 81 | * Returns true if the two regions are equal. |
| 82 | * @stable ICU 51 |
| 83 | */ |
| 84 | UBool operator==(const Region &that) const; |
| 85 | |
| 86 | /** |
| 87 | * Returns true if the two regions are NOT equal; that is, if operator ==() returns false. |
| 88 | * @stable ICU 51 |
| 89 | */ |
| 90 | UBool operator!=(const Region &that) const; |
| 91 | |
| 92 | /** |
| 93 | * Returns a pointer to a Region using the given region code. The region code can be either 2-letter ISO code, |
| 94 | * 3-letter ISO code, UNM.49 numeric code, or other valid Unicode Region Code as defined by the LDML specification. |
| 95 | * The identifier will be canonicalized internally using the supplemental metadata as defined in the CLDR. |
| 96 | * If the region code is NULL or not recognized, the appropriate error code will be set ( U_ILLEGAL_ARGUMENT_ERROR ) |
| 97 | * @stable ICU 51 |
| 98 | */ |
| 99 | static const Region* U_EXPORT2 getInstance(const char *region_code, UErrorCode &status); |
| 100 | |
| 101 | /** |
| 102 | * Returns a pointer to a Region using the given numeric region code. If the numeric region code is not recognized, |
| 103 | * the appropriate error code will be set ( U_ILLEGAL_ARGUMENT_ERROR ). |
| 104 | * @stable ICU 51 |
| 105 | */ |
| 106 | static const Region* U_EXPORT2 getInstance (int32_t code, UErrorCode &status); |
| 107 | |
| 108 | /** |
| 109 | * Returns an enumeration over the IDs of all known regions that match the given type. |
| 110 | * @stable ICU 55 |
| 111 | */ |
| 112 | static StringEnumeration* U_EXPORT2 getAvailable(URegionType type, UErrorCode &status); |
| 113 | |
| 114 | /** |
| 115 | * Returns a pointer to the region that contains this region. Returns NULL if this region is code "001" (World) |
| 116 | * or "ZZ" (Unknown region). For example, calling this method with region "IT" (Italy) returns the |
| 117 | * region "039" (Southern Europe). |
| 118 | * @stable ICU 51 |
| 119 | */ |
| 120 | const Region* getContainingRegion() const; |
| 121 | |
| 122 | /** |
| 123 | * Return a pointer to the region that geographically contains this region and matches the given type, |
| 124 | * moving multiple steps up the containment chain if necessary. Returns NULL if no containing region can be found |
| 125 | * that matches the given type. Note: The URegionTypes = "URGN_GROUPING", "URGN_DEPRECATED", or "URGN_UNKNOWN" |
| 126 | * are not appropriate for use in this API. NULL will be returned in this case. For example, calling this method |
| 127 | * with region "IT" (Italy) for type "URGN_CONTINENT" returns the region "150" ( Europe ). |
| 128 | * @stable ICU 51 |
| 129 | */ |
| 130 | const Region* getContainingRegion(URegionType type) const; |
| 131 | |
| 132 | /** |
| 133 | * Return an enumeration over the IDs of all the regions that are immediate children of this region in the |
| 134 | * region hierarchy. These returned regions could be either macro regions, territories, or a mixture of the two, |
| 135 | * depending on the containment data as defined in CLDR. This API may return NULL if this region doesn't have |
| 136 | * any sub-regions. For example, calling this method with region "150" (Europe) returns an enumeration containing |
| 137 | * the various sub regions of Europe - "039" (Southern Europe) - "151" (Eastern Europe) - "154" (Northern Europe) |
| 138 | * and "155" (Western Europe). |
| 139 | * @stable ICU 55 |
| 140 | */ |
| 141 | StringEnumeration* getContainedRegions(UErrorCode &status) const; |
| 142 | |
| 143 | /** |
| 144 | * Returns an enumeration over the IDs of all the regions that are children of this region anywhere in the region |
| 145 | * hierarchy and match the given type. This API may return an empty enumeration if this region doesn't have any |
| 146 | * sub-regions that match the given type. For example, calling this method with region "150" (Europe) and type |
| 147 | * "URGN_TERRITORY" returns a set containing all the territories in Europe ( "FR" (France) - "IT" (Italy) - "DE" (Germany) etc. ) |
| 148 | * @stable ICU 55 |
| 149 | */ |
| 150 | StringEnumeration* getContainedRegions( URegionType type, UErrorCode &status ) const; |
| 151 | |
| 152 | /** |
| 153 | * Returns true if this region contains the supplied other region anywhere in the region hierarchy. |
| 154 | * @stable ICU 51 |
| 155 | */ |
| 156 | UBool contains(const Region &other) const; |
| 157 | |
| 158 | /** |
| 159 | * For deprecated regions, return an enumeration over the IDs of the regions that are the preferred replacement |
| 160 | * regions for this region. Returns null for a non-deprecated region. For example, calling this method with region |
| 161 | * "SU" (Soviet Union) would return a list of the regions containing "RU" (Russia), "AM" (Armenia), "AZ" (Azerbaijan), etc... |
| 162 | * @stable ICU 55 |
| 163 | */ |
| 164 | StringEnumeration* getPreferredValues(UErrorCode &status) const; |
| 165 | |
| 166 | /** |
| 167 | * Return this region's canonical region code. |
| 168 | * @stable ICU 51 |
| 169 | */ |
| 170 | const char* getRegionCode() const; |
| 171 | |
| 172 | /** |
| 173 | * Return this region's numeric code. |
| 174 | * Returns a negative value if the given region does not have a numeric code assigned to it. |
| 175 | * @stable ICU 51 |
| 176 | */ |
| 177 | int32_t getNumericCode() const; |
| 178 | |
| 179 | /** |
| 180 | * Returns the region type of this region. |
| 181 | * @stable ICU 51 |
| 182 | */ |
| 183 | URegionType getType() const; |
| 184 | |
| 185 | #ifndef U_HIDE_INTERNAL_API |
| 186 | /** |
| 187 | * Cleans up statically allocated memory. |
| 188 | * @internal |
| 189 | */ |
| 190 | static void cleanupRegionData(); |
| 191 | #endif /* U_HIDE_INTERNAL_API */ |
| 192 | |
| 193 | private: |
| 194 | char id[4]; |
| 195 | UnicodeString idStr; |
| 196 | int32_t code; |
| 197 | URegionType fType; |
| 198 | Region *containingRegion; |
| 199 | UVector *containedRegions; |
| 200 | UVector *preferredValues; |
| 201 | |
| 202 | /** |
| 203 | * Default Constructor. Internal - use factory methods only. |
| 204 | */ |
| 205 | Region(); |
| 206 | |
| 207 | |
| 208 | /* |
| 209 | * Initializes the region data from the ICU resource bundles. The region data |
| 210 | * contains the basic relationships such as which regions are known, what the numeric |
| 211 | * codes are, any known aliases, and the territory containment data. |
| 212 | * |
| 213 | * If the region data has already loaded, then this method simply returns without doing |
| 214 | * anything meaningful. |
| 215 | */ |
| 216 | |
| 217 | static void U_CALLCONV loadRegionData(UErrorCode &status); |
| 218 | |
| 219 | }; |
| 220 | |
| 221 | U_NAMESPACE_END |
| 222 | |
| 223 | #endif /* #if !UCONFIG_NO_FORMATTING */ |
| 224 | |
| 225 | #endif /* U_SHOW_CPLUSPLUS_API */ |
| 226 | |
| 227 | #endif // REGION_H |
| 228 | |
| 229 | //eof |
| 230 | |