| 1 | // © 2019 and later: Unicode, Inc. and others. |
| 2 | // License & terms of use: http://www.unicode.org/copyright.html#License |
| 3 | |
| 4 | // localeprioritylist.cpp |
| 5 | // created: 2019jul11 Markus W. Scherer |
| 6 | |
| 7 | #include "unicode/utypes.h" |
| 8 | #include "unicode/localpointer.h" |
| 9 | #include "unicode/locid.h" |
| 10 | #include "unicode/stringpiece.h" |
| 11 | #include "unicode/uobject.h" |
| 12 | #include "charstr.h" |
| 13 | #include "cmemory.h" |
| 14 | #include "localeprioritylist.h" |
| 15 | #include "uarrsort.h" |
| 16 | #include "uassert.h" |
| 17 | #include "uhash.h" |
| 18 | |
| 19 | U_NAMESPACE_BEGIN |
| 20 | |
| 21 | namespace { |
| 22 | |
| 23 | int32_t hashLocale(const UHashTok token) { |
| 24 | auto *locale = static_cast<const Locale *>(token.pointer); |
| 25 | return locale->hashCode(); |
| 26 | } |
| 27 | |
| 28 | UBool compareLocales(const UHashTok t1, const UHashTok t2) { |
| 29 | auto *l1 = static_cast<const Locale *>(t1.pointer); |
| 30 | auto *l2 = static_cast<const Locale *>(t2.pointer); |
| 31 | return *l1 == *l2; |
| 32 | } |
| 33 | |
| 34 | constexpr int32_t WEIGHT_ONE = 1000; |
| 35 | |
| 36 | struct LocaleAndWeight { |
| 37 | Locale *locale; |
| 38 | int32_t weight; // 0..1000 = 0.0..1.0 |
| 39 | int32_t index; // force stable sort |
| 40 | |
| 41 | int32_t compare(const LocaleAndWeight &other) const { |
| 42 | int32_t diff = other.weight - weight; // descending: other-this |
| 43 | if (diff != 0) { return diff; } |
| 44 | return index - other.index; |
| 45 | } |
| 46 | }; |
| 47 | |
| 48 | int32_t U_CALLCONV |
| 49 | compareLocaleAndWeight(const void * /*context*/, const void *left, const void *right) { |
| 50 | return static_cast<const LocaleAndWeight *>(left)-> |
| 51 | compare(*static_cast<const LocaleAndWeight *>(right)); |
| 52 | } |
| 53 | |
| 54 | const char *skipSpaces(const char *p, const char *limit) { |
| 55 | while (p < limit && *p == ' ') { ++p; } |
| 56 | return p; |
| 57 | } |
| 58 | |
| 59 | int32_t findTagLength(const char *p, const char *limit) { |
| 60 | // Look for accept-language delimiters. |
| 61 | // Leave other validation up to the Locale constructor. |
| 62 | const char *q; |
| 63 | for (q = p; q < limit; ++q) { |
| 64 | char c = *q; |
| 65 | if (c == ' ' || c == ',' || c == ';') { break; } |
| 66 | } |
| 67 | return static_cast<int32_t>(q - p); |
| 68 | } |
| 69 | |
| 70 | /** |
| 71 | * Parses and returns a qvalue weight in millis. |
| 72 | * Advances p to after the parsed substring. |
| 73 | * Returns a negative value if parsing fails. |
| 74 | */ |
| 75 | int32_t parseWeight(const char *&p, const char *limit) { |
| 76 | p = skipSpaces(p, limit); |
| 77 | char c; |
| 78 | if (p == limit || ((c = *p) != '0' && c != '1')) { return -1; } |
| 79 | int32_t weight = (c - '0') * 1000; |
| 80 | if (++p == limit || *p != '.') { return weight; } |
| 81 | int32_t multiplier = 100; |
| 82 | while (++p != limit && '0' <= (c = *p) && c <= '9') { |
| 83 | c -= '0'; |
| 84 | if (multiplier > 0) { |
| 85 | weight += c * multiplier; |
| 86 | multiplier /= 10; |
| 87 | } else if (multiplier == 0) { |
| 88 | // round up |
| 89 | if (c >= 5) { ++weight; } |
| 90 | multiplier = -1; |
| 91 | } // else ignore further fraction digits |
| 92 | } |
| 93 | return weight <= WEIGHT_ONE ? weight : -1; // bad if > 1.0 |
| 94 | } |
| 95 | |
| 96 | } // namespace |
| 97 | |
| 98 | /** |
| 99 | * Nothing but a wrapper over a MaybeStackArray of LocaleAndWeight. |
| 100 | * |
| 101 | * This wrapper exists (and is not in an anonymous namespace) |
| 102 | * so that we can forward-declare it in the header file and |
| 103 | * don't have to expose the MaybeStackArray specialization and |
| 104 | * the LocaleAndWeight to code (like the test) that #includes localeprioritylist.h. |
| 105 | * Also, otherwise we would have to do a platform-specific |
| 106 | * template export declaration of some kind for the MaybeStackArray specialization |
| 107 | * to be properly exported from the common DLL. |
| 108 | */ |
| 109 | struct LocaleAndWeightArray : public UMemory { |
| 110 | MaybeStackArray<LocaleAndWeight, 20> array; |
| 111 | }; |
| 112 | |
| 113 | LocalePriorityList::LocalePriorityList(StringPiece s, UErrorCode &errorCode) { |
| 114 | if (U_FAILURE(errorCode)) { return; } |
| 115 | list = new LocaleAndWeightArray(); |
| 116 | if (list == nullptr) { |
| 117 | errorCode = U_MEMORY_ALLOCATION_ERROR; |
| 118 | return; |
| 119 | } |
| 120 | const char *p = s.data(); |
| 121 | const char *limit = p + s.length(); |
| 122 | while ((p = skipSpaces(p, limit)) != limit) { |
| 123 | if (*p == ',') { // empty range field |
| 124 | ++p; |
| 125 | continue; |
| 126 | } |
| 127 | int32_t tagLength = findTagLength(p, limit); |
| 128 | if (tagLength == 0) { |
| 129 | errorCode = U_ILLEGAL_ARGUMENT_ERROR; |
| 130 | return; |
| 131 | } |
| 132 | CharString tag(p, tagLength, errorCode); |
| 133 | if (U_FAILURE(errorCode)) { return; } |
| 134 | Locale locale = Locale(tag.data()); |
| 135 | if (locale.isBogus()) { |
| 136 | errorCode = U_ILLEGAL_ARGUMENT_ERROR; |
| 137 | return; |
| 138 | } |
| 139 | int32_t weight = WEIGHT_ONE; |
| 140 | if ((p = skipSpaces(p + tagLength, limit)) != limit && *p == ';') { |
| 141 | if ((p = skipSpaces(p + 1, limit)) == limit || *p != 'q' || |
| 142 | (p = skipSpaces(p + 1, limit)) == limit || *p != '=' || |
| 143 | (++p, (weight = parseWeight(p, limit)) < 0)) { |
| 144 | errorCode = U_ILLEGAL_ARGUMENT_ERROR; |
| 145 | return; |
| 146 | } |
| 147 | p = skipSpaces(p, limit); |
| 148 | } |
| 149 | if (p != limit && *p != ',') { // trailing junk |
| 150 | errorCode = U_ILLEGAL_ARGUMENT_ERROR; |
| 151 | return; |
| 152 | } |
| 153 | add(locale, weight, errorCode); |
| 154 | if (p == limit) { break; } |
| 155 | ++p; |
| 156 | } |
| 157 | sort(errorCode); |
| 158 | } |
| 159 | |
| 160 | LocalePriorityList::~LocalePriorityList() { |
| 161 | if (list != nullptr) { |
| 162 | for (int32_t i = 0; i < listLength; ++i) { |
| 163 | delete list->array[i].locale; |
| 164 | } |
| 165 | delete list; |
| 166 | } |
| 167 | uhash_close(map); |
| 168 | } |
| 169 | |
| 170 | const Locale *LocalePriorityList::localeAt(int32_t i) const { |
| 171 | return list->array[i].locale; |
| 172 | } |
| 173 | |
| 174 | Locale *LocalePriorityList::orphanLocaleAt(int32_t i) { |
| 175 | if (list == nullptr) { return nullptr; } |
| 176 | LocaleAndWeight &lw = list->array[i]; |
| 177 | Locale *l = lw.locale; |
| 178 | lw.locale = nullptr; |
| 179 | return l; |
| 180 | } |
| 181 | |
| 182 | bool LocalePriorityList::add(const Locale &locale, int32_t weight, UErrorCode &errorCode) { |
| 183 | if (U_FAILURE(errorCode)) { return false; } |
| 184 | if (map == nullptr) { |
| 185 | if (weight <= 0) { return true; } // do not add q=0 |
| 186 | map = uhash_open(hashLocale, compareLocales, uhash_compareLong, &errorCode); |
| 187 | if (U_FAILURE(errorCode)) { return false; } |
| 188 | } |
| 189 | LocalPointer<Locale> clone; |
| 190 | int32_t index = uhash_geti(map, &locale); |
| 191 | if (index != 0) { |
| 192 | // Duplicate: Remove the old item and append it anew. |
| 193 | LocaleAndWeight &lw = list->array[index - 1]; |
| 194 | clone.adoptInstead(lw.locale); |
| 195 | lw.locale = nullptr; |
| 196 | lw.weight = 0; |
| 197 | ++numRemoved; |
| 198 | } |
| 199 | if (weight <= 0) { // do not add q=0 |
| 200 | if (index != 0) { |
| 201 | // Not strictly necessary but cleaner. |
| 202 | uhash_removei(map, &locale); |
| 203 | } |
| 204 | return true; |
| 205 | } |
| 206 | if (clone.isNull()) { |
| 207 | clone.adoptInstead(locale.clone()); |
| 208 | if (clone.isNull() || (clone->isBogus() && !locale.isBogus())) { |
| 209 | errorCode = U_MEMORY_ALLOCATION_ERROR; |
| 210 | return false; |
| 211 | } |
| 212 | } |
| 213 | if (listLength == list->array.getCapacity()) { |
| 214 | int32_t newCapacity = listLength < 50 ? 100 : 4 * listLength; |
| 215 | if (list->array.resize(newCapacity, listLength) == nullptr) { |
| 216 | errorCode = U_MEMORY_ALLOCATION_ERROR; |
| 217 | return false; |
| 218 | } |
| 219 | } |
| 220 | uhash_puti(map, clone.getAlias(), listLength + 1, &errorCode); |
| 221 | if (U_FAILURE(errorCode)) { return false; } |
| 222 | LocaleAndWeight &lw = list->array[listLength]; |
| 223 | lw.locale = clone.orphan(); |
| 224 | lw.weight = weight; |
| 225 | lw.index = listLength++; |
| 226 | if (weight < WEIGHT_ONE) { hasWeights = true; } |
| 227 | U_ASSERT(uhash_count(map) == getLength()); |
| 228 | return true; |
| 229 | } |
| 230 | |
| 231 | void LocalePriorityList::sort(UErrorCode &errorCode) { |
| 232 | // Sort by descending weights if there is a mix of weights. |
| 233 | // The comparator forces a stable sort via the item index. |
| 234 | if (U_FAILURE(errorCode) || getLength() <= 1 || !hasWeights) { return; } |
| 235 | uprv_sortArray(list->array.getAlias(), listLength, sizeof(LocaleAndWeight), |
| 236 | compareLocaleAndWeight, nullptr, FALSE, &errorCode); |
| 237 | } |
| 238 | |
| 239 | U_NAMESPACE_END |
| 240 | |