/*
 * Copyright (C) 2015 The Android Open Source Project
 *
 * Licensed under the Apache License, Version 2.0 (the "License");
 * you may not use this file except in compliance with the License.
 * You may obtain a copy of the License at
 *
 *      http://www.apache.org/licenses/LICENSE-2.0
 *
 * Unless required by applicable law or agreed to in writing, software
 * distributed under the License is distributed on an "AS IS" BASIS,
 * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
 * See the License for the specific language governing permissions and
 * limitations under the License.
 */
| 16 | |
Mårten Kongstad | e0930d3 | 2018-10-18 14:50:15 +0200 | [diff] [blame] | 17 | #include "android-base/macros.h" |
Mårten Kongstad | 24c9aa6 | 2018-06-20 08:46:41 +0200 | [diff] [blame] | 18 | #include "androidfw/Locale.h" |
| 19 | #include "androidfw/Util.h" |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 20 | |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 21 | #include <ctype.h> |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 22 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 23 | #include <algorithm> |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 24 | #include <string> |
| 25 | #include <vector> |
| 26 | |
Adam Lesinski | b58c3ef | 2017-09-12 17:39:52 -0700 | [diff] [blame] | 27 | using ::android::ResTable_config; |
| 28 | using ::android::StringPiece; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 29 | |
Mårten Kongstad | 24c9aa6 | 2018-06-20 08:46:41 +0200 | [diff] [blame] | 30 | namespace android { |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 31 | |
// Copies the NUL-terminated string `source` into the fixed-size array `dest`,
// passing every character through `t(index, character)` first.
//
// At most N characters are copied. Any remaining slots of `dest` are filled
// with '\0'. When `source` holds N or more characters the result is NOT
// NUL-terminated: all N slots carry payload.
//
// A null `source` is treated like an empty string, i.e. `dest` is zero-filled.
template <size_t N, class Transformer>
static void safe_transform_copy(const char* source, char (&dest)[N], Transformer t) {
  size_t i = 0;
  if (source != nullptr) {
    // The index handed to the transformer is read in its own expression, so
    // the result does not depend on the evaluation order of `dest[i++] = t(i, ...)`.
    for (; i < N && source[i] != '\0'; ++i) {
      dest[i] = t(i, source[i]);
    }
  }
  // Zero-pad whatever is left of the destination.
  for (; i < N; ++i) {
    dest[i] = '\0';
  }
}
| 43 | |
| 44 | void LocaleValue::set_language(const char* language_chars) { |
| 45 | safe_transform_copy(language_chars, language, [](size_t, char c) { return ::tolower(c); }); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 46 | } |
| 47 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 48 | void LocaleValue::set_region(const char* region_chars) { |
Yurii Zubrytskyi | d375260 | 2021-12-01 09:11:46 -0800 | [diff] [blame] | 49 | safe_transform_copy(region_chars, region, [](size_t, char c) { return ::toupper(c); }); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 50 | } |
| 51 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 52 | void LocaleValue::set_script(const char* script_chars) { |
Yurii Zubrytskyi | d375260 | 2021-12-01 09:11:46 -0800 | [diff] [blame] | 53 | safe_transform_copy(script_chars, script, |
| 54 | [](size_t i, char c) { return i ? ::tolower(c) : ::toupper(c); }); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 55 | } |
| 56 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 57 | void LocaleValue::set_variant(const char* variant_chars) { |
Yurii Zubrytskyi | d375260 | 2021-12-01 09:11:46 -0800 | [diff] [blame] | 58 | safe_transform_copy(variant_chars, variant, [](size_t, char c) { return c; }); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 59 | } |
| 60 | |
// Returns true when every character of `str` is alphabetic according to
// ::isalpha. An empty string yields true.
static inline bool is_alpha(const std::string& str) {
  return std::all_of(str.begin(), str.end(), [](char c) {
    // ::isalpha is only defined for values representable as unsigned char
    // (or EOF), so bytes >= 0x80 must not be passed as a negative char.
    return ::isalpha(static_cast<unsigned char>(c)) != 0;
  });
}
| 64 | |
// Returns true when every character of `str` is a decimal digit according to
// ::isdigit. An empty string yields true.
static inline bool is_number(const std::string& str) {
  return std::all_of(str.begin(), str.end(), [](char c) {
    // ::isdigit is only defined for values representable as unsigned char
    // (or EOF), so bytes >= 0x80 must not be passed as a negative char.
    return ::isdigit(static_cast<unsigned char>(c)) != 0;
  });
}
| 68 | |
Yurii Zubrytskyi | a577514 | 2022-11-02 17:49:49 -0700 | [diff] [blame] | 69 | bool LocaleValue::InitFromFilterString(StringPiece str) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 70 | // A locale (as specified in the filter) is an underscore separated name such |
| 71 | // as "en_US", "en_Latn_US", or "en_US_POSIX". |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 72 | std::vector<std::string> parts = util::SplitAndLowercase(str, '_'); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 73 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 74 | const int num_tags = parts.size(); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 75 | bool valid = false; |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 76 | if (num_tags >= 1) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 77 | const std::string& lang = parts[0]; |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 78 | if (is_alpha(lang) && (lang.length() == 2 || lang.length() == 3)) { |
| 79 | set_language(lang.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 80 | valid = true; |
| 81 | } |
| 82 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 83 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 84 | if (!valid || num_tags == 1) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 85 | return valid; |
| 86 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 87 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 88 | // At this point, valid == true && numTags > 1. |
| 89 | const std::string& part2 = parts[1]; |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 90 | if ((part2.length() == 2 && is_alpha(part2)) || |
| 91 | (part2.length() == 3 && is_number(part2))) { |
| 92 | set_region(part2.c_str()); |
| 93 | } else if (part2.length() == 4 && is_alpha(part2)) { |
| 94 | set_script(part2.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 95 | } else if (part2.length() >= 4 && part2.length() <= 8) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 96 | set_variant(part2.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 97 | } else { |
| 98 | valid = false; |
| 99 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 100 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 101 | if (!valid || num_tags == 2) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 102 | return valid; |
| 103 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 104 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 105 | // At this point, valid == true && numTags > 1. |
| 106 | const std::string& part3 = parts[2]; |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 107 | if (((part3.length() == 2 && is_alpha(part3)) || |
| 108 | (part3.length() == 3 && is_number(part3))) && |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 109 | script[0]) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 110 | set_region(part3.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 111 | } else if (part3.length() >= 4 && part3.length() <= 8) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 112 | set_variant(part3.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 113 | } else { |
| 114 | valid = false; |
| 115 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 116 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 117 | if (!valid || num_tags == 3) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 118 | return valid; |
| 119 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 120 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 121 | const std::string& part4 = parts[3]; |
| 122 | if (part4.length() >= 4 && part4.length() <= 8) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 123 | set_variant(part4.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 124 | } else { |
| 125 | valid = false; |
| 126 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 127 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 128 | if (!valid || num_tags > 4) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 129 | return false; |
| 130 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 131 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 132 | return true; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 133 | } |
| 134 | |
Yurii Zubrytskyi | a577514 | 2022-11-02 17:49:49 -0700 | [diff] [blame] | 135 | bool LocaleValue::InitFromBcp47Tag(StringPiece bcp47tag) { |
Adam Lesinski | b58c3ef | 2017-09-12 17:39:52 -0700 | [diff] [blame] | 136 | return InitFromBcp47TagImpl(bcp47tag, '-'); |
| 137 | } |
| 138 | |
Yurii Zubrytskyi | a577514 | 2022-11-02 17:49:49 -0700 | [diff] [blame] | 139 | bool LocaleValue::InitFromBcp47TagImpl(StringPiece bcp47tag, const char separator) { |
Adam Lesinski | b58c3ef | 2017-09-12 17:39:52 -0700 | [diff] [blame] | 140 | std::vector<std::string> subtags = util::SplitAndLowercase(bcp47tag, separator); |
| 141 | if (subtags.size() == 1) { |
| 142 | set_language(subtags[0].c_str()); |
| 143 | } else if (subtags.size() == 2) { |
| 144 | set_language(subtags[0].c_str()); |
| 145 | |
| 146 | // The second tag can either be a region, a variant or a script. |
| 147 | switch (subtags[1].size()) { |
| 148 | case 2: |
| 149 | case 3: |
| 150 | set_region(subtags[1].c_str()); |
| 151 | break; |
| 152 | case 4: |
| 153 | if ('0' <= subtags[1][0] && subtags[1][0] <= '9') { |
| 154 | // This is a variant: fall through |
| 155 | } else { |
| 156 | set_script(subtags[1].c_str()); |
| 157 | break; |
| 158 | } |
Mårten Kongstad | e0930d3 | 2018-10-18 14:50:15 +0200 | [diff] [blame] | 159 | FALLTHROUGH_INTENDED; |
Adam Lesinski | b58c3ef | 2017-09-12 17:39:52 -0700 | [diff] [blame] | 160 | case 5: |
| 161 | case 6: |
| 162 | case 7: |
| 163 | case 8: |
| 164 | set_variant(subtags[1].c_str()); |
| 165 | break; |
| 166 | default: |
| 167 | return false; |
| 168 | } |
| 169 | } else if (subtags.size() == 3) { |
| 170 | // The language is always the first subtag. |
| 171 | set_language(subtags[0].c_str()); |
| 172 | |
| 173 | // The second subtag can either be a script or a region code. |
| 174 | // If its size is 4, it's a script code, else it's a region code. |
| 175 | if (subtags[1].size() == 4) { |
| 176 | set_script(subtags[1].c_str()); |
| 177 | } else if (subtags[1].size() == 2 || subtags[1].size() == 3) { |
| 178 | set_region(subtags[1].c_str()); |
| 179 | } else { |
| 180 | return false; |
| 181 | } |
| 182 | |
| 183 | // The third tag can either be a region code (if the second tag was |
| 184 | // a script), else a variant code. |
| 185 | if (subtags[2].size() >= 4) { |
| 186 | set_variant(subtags[2].c_str()); |
| 187 | } else { |
| 188 | set_region(subtags[2].c_str()); |
| 189 | } |
| 190 | } else if (subtags.size() == 4) { |
| 191 | set_language(subtags[0].c_str()); |
| 192 | set_script(subtags[1].c_str()); |
| 193 | set_region(subtags[2].c_str()); |
| 194 | set_variant(subtags[3].c_str()); |
| 195 | } else { |
| 196 | return false; |
| 197 | } |
| 198 | return true; |
| 199 | } |
| 200 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 201 | ssize_t LocaleValue::InitFromParts(std::vector<std::string>::iterator iter, |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 202 | std::vector<std::string>::iterator end) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 203 | const std::vector<std::string>::iterator start_iter = iter; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 204 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 205 | std::string& part = *iter; |
| 206 | if (part[0] == 'b' && part[1] == '+') { |
| 207 | // This is a "modified" BCP 47 language tag. Same semantics as BCP 47 tags, |
Adam Lesinski | b58c3ef | 2017-09-12 17:39:52 -0700 | [diff] [blame] | 208 | // except that the separator is "+" and not "-". Skip the prefix 'b+'. |
| 209 | if (!InitFromBcp47TagImpl(StringPiece(part).substr(2), '+')) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 210 | return -1; |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 211 | } |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 212 | ++iter; |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 213 | } else { |
Adam Lesinski | b58c3ef | 2017-09-12 17:39:52 -0700 | [diff] [blame] | 214 | if ((part.length() == 2 || part.length() == 3) && is_alpha(part) && part != "car") { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 215 | set_language(part.c_str()); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 216 | ++iter; |
| 217 | |
| 218 | if (iter != end) { |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 219 | const std::string& region_part = *iter; |
| 220 | if (region_part.c_str()[0] == 'r' && region_part.length() == 3) { |
| 221 | set_region(region_part.c_str() + 1); |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 222 | ++iter; |
| 223 | } |
| 224 | } |
| 225 | } |
| 226 | } |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 227 | return static_cast<ssize_t>(iter - start_iter); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 228 | } |
| 229 | |
Yurii Zubrytskyi | d375260 | 2021-12-01 09:11:46 -0800 | [diff] [blame] | 230 | // Make sure the following memcpy's are properly sized. |
| 231 | static_assert(sizeof(ResTable_config::localeScript) == sizeof(LocaleValue::script)); |
| 232 | static_assert(sizeof(ResTable_config::localeVariant) == sizeof(LocaleValue::variant)); |
| 233 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 234 | void LocaleValue::InitFromResTable(const ResTable_config& config) { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 235 | config.unpackLanguage(language); |
| 236 | config.unpackRegion(region); |
| 237 | if (config.localeScript[0] && !config.localeScriptWasComputed) { |
| 238 | memcpy(script, config.localeScript, sizeof(config.localeScript)); |
| 239 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 240 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 241 | if (config.localeVariant[0]) { |
| 242 | memcpy(variant, config.localeVariant, sizeof(config.localeVariant)); |
| 243 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 244 | } |
| 245 | |
Adam Lesinski | ce5e56e | 2016-10-21 17:56:45 -0700 | [diff] [blame] | 246 | void LocaleValue::WriteTo(ResTable_config* out) const { |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 247 | out->packLanguage(language); |
| 248 | out->packRegion(region); |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 249 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 250 | if (script[0]) { |
| 251 | memcpy(out->localeScript, script, sizeof(out->localeScript)); |
| 252 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 253 | |
Adam Lesinski | cacb28f | 2016-10-19 12:18:14 -0700 | [diff] [blame] | 254 | if (variant[0]) { |
| 255 | memcpy(out->localeVariant, variant, sizeof(out->localeVariant)); |
| 256 | } |
Adam Lesinski | 6f6ceb7 | 2014-11-14 14:48:12 -0800 | [diff] [blame] | 257 | } |
| 258 | |
Mårten Kongstad | 24c9aa6 | 2018-06-20 08:46:41 +0200 | [diff] [blame] | 259 | } // namespace android |