gfx/skia/trunk/src/sfnt/SkOTTable_name.cpp

changeset 0
6474c204b198
     1.1 --- /dev/null	Thu Jan 01 00:00:00 1970 +0000
     1.2 +++ b/gfx/skia/trunk/src/sfnt/SkOTTable_name.cpp	Wed Dec 31 06:09:35 2014 +0100
     1.3 @@ -0,0 +1,534 @@
     1.4 +/*
     1.5 + * Copyright 2013 Google Inc.
     1.6 + *
     1.7 + * Use of this source code is governed by a BSD-style license that can be
     1.8 + * found in the LICENSE file.
     1.9 + */
    1.10 +
    1.11 +#include "SkOTTable_name.h"
    1.12 +
    1.13 +#include "SkEndian.h"
    1.14 +#include "SkString.h"
    1.15 +#include "SkTSearch.h"
    1.16 +#include "SkTemplates.h"
    1.17 +#include "SkUtils.h"
    1.18 +
    1.19 +static SkUnichar SkUTF16BE_NextUnichar(const uint16_t** srcPtr) {
    1.20 +    SkASSERT(srcPtr && *srcPtr);
    1.21 +
    1.22 +    const uint16_t* src = *srcPtr;
    1.23 +    SkUnichar c = SkEndian_SwapBE16(*src++);
    1.24 +
    1.25 +    SkASSERT(!SkUTF16_IsLowSurrogate(c));
    1.26 +    if (SkUTF16_IsHighSurrogate(c)) {
    1.27 +        unsigned c2 = SkEndian_SwapBE16(*src++);
    1.28 +        SkASSERT(SkUTF16_IsLowSurrogate(c2));
    1.29 +
    1.30 +        c = (c << 10) + c2 + (0x10000 - (0xD800 << 10) - 0xDC00);
    1.31 +    }
    1.32 +    *srcPtr = src;
    1.33 +    return c;
    1.34 +}
    1.35 +
    1.36 +static void SkStringFromUTF16BE(const uint16_t* utf16be, size_t length, SkString& utf8) {
    1.37 +    SkASSERT(utf16be != NULL);
    1.38 +
    1.39 +    utf8.reset();
    1.40 +    size_t numberOf16BitValues = length / 2;
    1.41 +    const uint16_t* end = utf16be + numberOf16BitValues;
    1.42 +    while (utf16be < end) {
    1.43 +        utf8.appendUnichar(SkUTF16BE_NextUnichar(&utf16be));
    1.44 +    }
    1.45 +}
    1.46 +
    1.47 +/** UnicodeFromMacRoman[macRomanPoint - 0x80] -> unicodeCodePoint.
    1.48 + *  Derived from http://www.unicode.org/Public/MAPPINGS/VENDORS/APPLE/ROMAN.TXT .
    1.49 + *  In MacRoman the first 128 code points match ASCII code points.
    1.50 + *  This maps the second 128 MacRoman code points to unicode code points.
    1.51 + */
    1.52 +static uint16_t UnicodeFromMacRoman[0x80] = {
    1.53 +    0x00C4, 0x00C5, 0x00C7, 0x00C9, 0x00D1, 0x00D6, 0x00DC, 0x00E1,
    1.54 +    0x00E0, 0x00E2, 0x00E4, 0x00E3, 0x00E5, 0x00E7, 0x00E9, 0x00E8,
    1.55 +    0x00EA, 0x00EB, 0x00ED, 0x00EC, 0x00EE, 0x00EF, 0x00F1, 0x00F3,
    1.56 +    0x00F2, 0x00F4, 0x00F6, 0x00F5, 0x00FA, 0x00F9, 0x00FB, 0x00FC,
    1.57 +    0x2020, 0x00B0, 0x00A2, 0x00A3, 0x00A7, 0x2022, 0x00B6, 0x00DF,
    1.58 +    0x00AE, 0x00A9, 0x2122, 0x00B4, 0x00A8, 0x2260, 0x00C6, 0x00D8,
    1.59 +    0x221E, 0x00B1, 0x2264, 0x2265, 0x00A5, 0x00B5, 0x2202, 0x2211,
    1.60 +    0x220F, 0x03C0, 0x222B, 0x00AA, 0x00BA, 0x03A9, 0x00E6, 0x00F8,
    1.61 +    0x00BF, 0x00A1, 0x00AC, 0x221A, 0x0192, 0x2248, 0x2206, 0x00AB,
    1.62 +    0x00BB, 0x2026, 0x00A0, 0x00C0, 0x00C3, 0x00D5, 0x0152, 0x0153,
    1.63 +    0x2013, 0x2014, 0x201C, 0x201D, 0x2018, 0x2019, 0x00F7, 0x25CA,
    1.64 +    0x00FF, 0x0178, 0x2044, 0x20AC, 0x2039, 0x203A, 0xFB01, 0xFB02,
    1.65 +    0x2021, 0x00B7, 0x201A, 0x201E, 0x2030, 0x00C2, 0x00CA, 0x00C1,
    1.66 +    0x00CB, 0x00C8, 0x00CD, 0x00CE, 0x00CF, 0x00CC, 0x00D3, 0x00D4,
    1.67 +    0xF8FF, 0x00D2, 0x00DA, 0x00DB, 0x00D9, 0x0131, 0x02C6, 0x02DC,
    1.68 +    0x00AF, 0x02D8, 0x02D9, 0x02DA, 0x00B8, 0x02DD, 0x02DB, 0x02C7,
    1.69 +};
    1.70 +
    1.71 +static void SkStringFromMacRoman(const uint8_t* macRoman, size_t length, SkString& utf8) {
    1.72 +    utf8.reset();
    1.73 +    for (size_t i = 0; i < length; ++i) {
    1.74 +        utf8.appendUnichar(macRoman[i] < 0x80 ? macRoman[i]
    1.75 +                                              : UnicodeFromMacRoman[macRoman[i] - 0x80]);
    1.76 +    }
    1.77 +}
    1.78 +
    1.79 +static struct BCP47FromLanguageId {
    1.80 +    uint16_t languageID;
    1.81 +    const char* bcp47;
    1.82 +}
    1.83 +/** The Mac and Windows values do not conflict, so this is currently one single table. */
    1.84 +BCP47FromLanguageID[] = {
    1.85 +    /** A mapping from Mac Language Designators to BCP 47 codes.
    1.86 +     *  The following list was constructed more or less manually.
    1.87 +     *  Apple now uses BCP 47 (post OSX10.4), so there will be no new entries.
    1.88 +     */
    1.89 +    {0, "en"}, //English
    1.90 +    {1, "fr"}, //French
    1.91 +    {2, "de"}, //German
    1.92 +    {3, "it"}, //Italian
    1.93 +    {4, "nl"}, //Dutch
    1.94 +    {5, "sv"}, //Swedish
    1.95 +    {6, "es"}, //Spanish
    1.96 +    {7, "da"}, //Danish
    1.97 +    {8, "pt"}, //Portuguese
    1.98 +    {9, "nb"}, //Norwegian
    1.99 +    {10, "he"}, //Hebrew
   1.100 +    {11, "ja"}, //Japanese
   1.101 +    {12, "ar"}, //Arabic
   1.102 +    {13, "fi"}, //Finnish
   1.103 +    {14, "el"}, //Greek
   1.104 +    {15, "is"}, //Icelandic
   1.105 +    {16, "mt"}, //Maltese
   1.106 +    {17, "tr"}, //Turkish
   1.107 +    {18, "hr"}, //Croatian
   1.108 +    {19, "zh-Hant"}, //Chinese (Traditional)
   1.109 +    {20, "ur"}, //Urdu
   1.110 +    {21, "hi"}, //Hindi
   1.111 +    {22, "th"}, //Thai
   1.112 +    {23, "ko"}, //Korean
   1.113 +    {24, "lt"}, //Lithuanian
   1.114 +    {25, "pl"}, //Polish
   1.115 +    {26, "hu"}, //Hungarian
   1.116 +    {27, "et"}, //Estonian
   1.117 +    {28, "lv"}, //Latvian
   1.118 +    {29, "se"}, //Sami
   1.119 +    {30, "fo"}, //Faroese
   1.120 +    {31, "fa"}, //Farsi (Persian)
   1.121 +    {32, "ru"}, //Russian
   1.122 +    {33, "zh-Hans"}, //Chinese (Simplified)
   1.123 +    {34, "nl"}, //Dutch
   1.124 +    {35, "ga"}, //Irish(Gaelic)
   1.125 +    {36, "sq"}, //Albanian
   1.126 +    {37, "ro"}, //Romanian
   1.127 +    {38, "cs"}, //Czech
   1.128 +    {39, "sk"}, //Slovak
   1.129 +    {40, "sl"}, //Slovenian
   1.130 +    {41, "yi"}, //Yiddish
   1.131 +    {42, "sr"}, //Serbian
   1.132 +    {43, "mk"}, //Macedonian
   1.133 +    {44, "bg"}, //Bulgarian
   1.134 +    {45, "uk"}, //Ukrainian
   1.135 +    {46, "be"}, //Byelorussian
   1.136 +    {47, "uz"}, //Uzbek
   1.137 +    {48, "kk"}, //Kazakh
   1.138 +    {49, "az-Cyrl"}, //Azerbaijani (Cyrillic)
   1.139 +    {50, "az-Arab"}, //Azerbaijani (Arabic)
   1.140 +    {51, "hy"}, //Armenian
   1.141 +    {52, "ka"}, //Georgian
   1.142 +    {53, "mo"}, //Moldavian
   1.143 +    {54, "ky"}, //Kirghiz
   1.144 +    {55, "tg"}, //Tajiki
   1.145 +    {56, "tk"}, //Turkmen
   1.146 +    {57, "mn-Mong"}, //Mongolian (Traditional)
   1.147 +    {58, "mn-Cyrl"}, //Mongolian (Cyrillic)
   1.148 +    {59, "ps"}, //Pashto
   1.149 +    {60, "ku"}, //Kurdish
   1.150 +    {61, "ks"}, //Kashmiri
   1.151 +    {62, "sd"}, //Sindhi
   1.152 +    {63, "bo"}, //Tibetan
   1.153 +    {64, "ne"}, //Nepali
   1.154 +    {65, "sa"}, //Sanskrit
   1.155 +    {66, "mr"}, //Marathi
   1.156 +    {67, "bn"}, //Bengali
   1.157 +    {68, "as"}, //Assamese
   1.158 +    {69, "gu"}, //Gujarati
   1.159 +    {70, "pa"}, //Punjabi
   1.160 +    {71, "or"}, //Oriya
   1.161 +    {72, "ml"}, //Malayalam
   1.162 +    {73, "kn"}, //Kannada
   1.163 +    {74, "ta"}, //Tamil
   1.164 +    {75, "te"}, //Telugu
   1.165 +    {76, "si"}, //Sinhalese
   1.166 +    {77, "my"}, //Burmese
   1.167 +    {78, "km"}, //Khmer
   1.168 +    {79, "lo"}, //Lao
   1.169 +    {80, "vi"}, //Vietnamese
   1.170 +    {81, "id"}, //Indonesian
   1.171 +    {82, "tl"}, //Tagalog
   1.172 +    {83, "ms-Latn"}, //Malay (Roman)
   1.173 +    {84, "ms-Arab"}, //Malay (Arabic)
   1.174 +    {85, "am"}, //Amharic
   1.175 +    {86, "ti"}, //Tigrinya
   1.176 +    {87, "om"}, //Oromo
   1.177 +    {88, "so"}, //Somali
   1.178 +    {89, "sw"}, //Swahili
   1.179 +    {90, "rw"}, //Kinyarwanda/Ruanda
   1.180 +    {91, "rn"}, //Rundi
   1.181 +    {92, "ny"}, //Nyanja/Chewa
   1.182 +    {93, "mg"}, //Malagasy
   1.183 +    {94, "eo"}, //Esperanto
   1.184 +    {128, "cy"}, //Welsh
   1.185 +    {129, "eu"}, //Basque
   1.186 +    {130, "ca"}, //Catalan
   1.187 +    {131, "la"}, //Latin
   1.188 +    {132, "qu"}, //Quechua
   1.189 +    {133, "gn"}, //Guarani
   1.190 +    {134, "ay"}, //Aymara
   1.191 +    {135, "tt"}, //Tatar
   1.192 +    {136, "ug"}, //Uighur
   1.193 +    {137, "dz"}, //Dzongkha
   1.194 +    {138, "jv-Latn"}, //Javanese (Roman)
   1.195 +    {139, "su-Latn"}, //Sundanese (Roman)
   1.196 +    {140, "gl"}, //Galician
   1.197 +    {141, "af"}, //Afrikaans
   1.198 +    {142, "br"}, //Breton
   1.199 +    {143, "iu"}, //Inuktitut
   1.200 +    {144, "gd"}, //Scottish (Gaelic)
   1.201 +    {145, "gv"}, //Manx (Gaelic)
   1.202 +    {146, "ga"}, //Irish (Gaelic with Lenition)
   1.203 +    {147, "to"}, //Tongan
   1.204 +    {148, "el"}, //Greek (Polytonic) Note: ISO 15924 does not have an equivalent script name.
   1.205 +    {149, "kl"}, //Greenlandic
   1.206 +    {150, "az-Latn"}, //Azerbaijani (Roman)
   1.207 +    {151, "nn"}, //Nynorsk
   1.208 +
   1.209 +    /** A mapping from Windows LCID to BCP 47 codes.
   1.210 +     *  This list is the sorted, curated output of tools/win_lcid.cpp.
   1.211 +     *  Note that these are sorted by value for quick binary lookup, and not logically by lsb.
   1.212 +     *  The 'bare' language ids (e.g. 0x0001 for Arabic) are ommitted
   1.213 +     *  as they do not appear as valid language ids in the OpenType specification.
   1.214 +     */
   1.215 +    { 0x0401, "ar-SA" }, //Arabic
   1.216 +    { 0x0402, "bg-BG" }, //Bulgarian
   1.217 +    { 0x0403, "ca-ES" }, //Catalan
   1.218 +    { 0x0404, "zh-TW" }, //Chinese (Traditional)
   1.219 +    { 0x0405, "cs-CZ" }, //Czech
   1.220 +    { 0x0406, "da-DK" }, //Danish
   1.221 +    { 0x0407, "de-DE" }, //German
   1.222 +    { 0x0408, "el-GR" }, //Greek
   1.223 +    { 0x0409, "en-US" }, //English
   1.224 +    { 0x040a, "es-ES_tradnl" }, //Spanish
   1.225 +    { 0x040b, "fi-FI" }, //Finnish
   1.226 +    { 0x040c, "fr-FR" }, //French
   1.227 +    { 0x040d, "he-IL" }, //Hebrew
   1.228 +    { 0x040d, "he" }, //Hebrew
   1.229 +    { 0x040e, "hu-HU" }, //Hungarian
   1.230 +    { 0x040e, "hu" }, //Hungarian
   1.231 +    { 0x040f, "is-IS" }, //Icelandic
   1.232 +    { 0x0410, "it-IT" }, //Italian
   1.233 +    { 0x0411, "ja-JP" }, //Japanese
   1.234 +    { 0x0412, "ko-KR" }, //Korean
   1.235 +    { 0x0413, "nl-NL" }, //Dutch
   1.236 +    { 0x0414, "nb-NO" }, //Norwegian (Bokmål)
   1.237 +    { 0x0415, "pl-PL" }, //Polish
   1.238 +    { 0x0416, "pt-BR" }, //Portuguese
   1.239 +    { 0x0417, "rm-CH" }, //Romansh
   1.240 +    { 0x0418, "ro-RO" }, //Romanian
   1.241 +    { 0x0419, "ru-RU" }, //Russian
   1.242 +    { 0x041a, "hr-HR" }, //Croatian
   1.243 +    { 0x041b, "sk-SK" }, //Slovak
   1.244 +    { 0x041c, "sq-AL" }, //Albanian
   1.245 +    { 0x041d, "sv-SE" }, //Swedish
   1.246 +    { 0x041e, "th-TH" }, //Thai
   1.247 +    { 0x041f, "tr-TR" }, //Turkish
   1.248 +    { 0x0420, "ur-PK" }, //Urdu
   1.249 +    { 0x0421, "id-ID" }, //Indonesian
   1.250 +    { 0x0422, "uk-UA" }, //Ukrainian
   1.251 +    { 0x0423, "be-BY" }, //Belarusian
   1.252 +    { 0x0424, "sl-SI" }, //Slovenian
   1.253 +    { 0x0425, "et-EE" }, //Estonian
   1.254 +    { 0x0426, "lv-LV" }, //Latvian
   1.255 +    { 0x0427, "lt-LT" }, //Lithuanian
   1.256 +    { 0x0428, "tg-Cyrl-TJ" }, //Tajik (Cyrillic)
   1.257 +    { 0x0429, "fa-IR" }, //Persian
   1.258 +    { 0x042a, "vi-VN" }, //Vietnamese
   1.259 +    { 0x042b, "hy-AM" }, //Armenian
   1.260 +    { 0x042c, "az-Latn-AZ" }, //Azeri (Latin)
   1.261 +    { 0x042d, "eu-ES" }, //Basque
   1.262 +    { 0x042e, "hsb-DE" }, //Upper Sorbian
   1.263 +    { 0x042f, "mk-MK" }, //Macedonian (FYROM)
   1.264 +    { 0x0432, "tn-ZA" }, //Setswana
   1.265 +    { 0x0434, "xh-ZA" }, //isiXhosa
   1.266 +    { 0x0435, "zu-ZA" }, //isiZulu
   1.267 +    { 0x0436, "af-ZA" }, //Afrikaans
   1.268 +    { 0x0437, "ka-GE" }, //Georgian
   1.269 +    { 0x0438, "fo-FO" }, //Faroese
   1.270 +    { 0x0439, "hi-IN" }, //Hindi
   1.271 +    { 0x043a, "mt-MT" }, //Maltese
   1.272 +    { 0x043b, "se-NO" }, //Sami (Northern)
   1.273 +    { 0x043e, "ms-MY" }, //Malay
   1.274 +    { 0x043f, "kk-KZ" }, //Kazakh
   1.275 +    { 0x0440, "ky-KG" }, //Kyrgyz
   1.276 +    { 0x0441, "sw-KE" }, //Kiswahili
   1.277 +    { 0x0442, "tk-TM" }, //Turkmen
   1.278 +    { 0x0443, "uz-Latn-UZ" }, //Uzbek (Latin)
   1.279 +    { 0x0443, "uz" }, //Uzbek
   1.280 +    { 0x0444, "tt-RU" }, //Tatar
   1.281 +    { 0x0445, "bn-IN" }, //Bengali
   1.282 +    { 0x0446, "pa-IN" }, //Punjabi
   1.283 +    { 0x0447, "gu-IN" }, //Gujarati
   1.284 +    { 0x0448, "or-IN" }, //Oriya
   1.285 +    { 0x0449, "ta-IN" }, //Tamil
   1.286 +    { 0x044a, "te-IN" }, //Telugu
   1.287 +    { 0x044b, "kn-IN" }, //Kannada
   1.288 +    { 0x044c, "ml-IN" }, //Malayalam
   1.289 +    { 0x044d, "as-IN" }, //Assamese
   1.290 +    { 0x044e, "mr-IN" }, //Marathi
   1.291 +    { 0x044f, "sa-IN" }, //Sanskrit
   1.292 +    { 0x0450, "mn-Cyrl" }, //Mongolian (Cyrillic)
   1.293 +    { 0x0451, "bo-CN" }, //Tibetan
   1.294 +    { 0x0452, "cy-GB" }, //Welsh
   1.295 +    { 0x0453, "km-KH" }, //Khmer
   1.296 +    { 0x0454, "lo-LA" }, //Lao
   1.297 +    { 0x0456, "gl-ES" }, //Galician
   1.298 +    { 0x0457, "kok-IN" }, //Konkani
   1.299 +    { 0x045a, "syr-SY" }, //Syriac
   1.300 +    { 0x045b, "si-LK" }, //Sinhala
   1.301 +    { 0x045d, "iu-Cans-CA" }, //Inuktitut (Syllabics)
   1.302 +    { 0x045e, "am-ET" }, //Amharic
   1.303 +    { 0x0461, "ne-NP" }, //Nepali
   1.304 +    { 0x0462, "fy-NL" }, //Frisian
   1.305 +    { 0x0463, "ps-AF" }, //Pashto
   1.306 +    { 0x0464, "fil-PH" }, //Filipino
   1.307 +    { 0x0465, "dv-MV" }, //Divehi
   1.308 +    { 0x0468, "ha-Latn-NG" }, //Hausa (Latin)
   1.309 +    { 0x046a, "yo-NG" }, //Yoruba
   1.310 +    { 0x046b, "quz-BO" }, //Quechua
   1.311 +    { 0x046c, "nso-ZA" }, //Sesotho sa Leboa
   1.312 +    { 0x046d, "ba-RU" }, //Bashkir
   1.313 +    { 0x046e, "lb-LU" }, //Luxembourgish
   1.314 +    { 0x046f, "kl-GL" }, //Greenlandic
   1.315 +    { 0x0470, "ig-NG" }, //Igbo
   1.316 +    { 0x0478, "ii-CN" }, //Yi
   1.317 +    { 0x047a, "arn-CL" }, //Mapudungun
   1.318 +    { 0x047c, "moh-CA" }, //Mohawk
   1.319 +    { 0x047e, "br-FR" }, //Breton
   1.320 +    { 0x0480, "ug-CN" }, //Uyghur
   1.321 +    { 0x0481, "mi-NZ" }, //Maori
   1.322 +    { 0x0482, "oc-FR" }, //Occitan
   1.323 +    { 0x0483, "co-FR" }, //Corsican
   1.324 +    { 0x0484, "gsw-FR" }, //Alsatian
   1.325 +    { 0x0485, "sah-RU" }, //Yakut
   1.326 +    { 0x0486, "qut-GT" }, //K'iche
   1.327 +    { 0x0487, "rw-RW" }, //Kinyarwanda
   1.328 +    { 0x0488, "wo-SN" }, //Wolof
   1.329 +    { 0x048c, "prs-AF" }, //Dari
   1.330 +    { 0x0491, "gd-GB" }, //Scottish Gaelic
   1.331 +    { 0x0801, "ar-IQ" }, //Arabic
   1.332 +    { 0x0804, "zh-Hans" }, //Chinese (Simplified)
   1.333 +    { 0x0807, "de-CH" }, //German
   1.334 +    { 0x0809, "en-GB" }, //English
   1.335 +    { 0x080a, "es-MX" }, //Spanish
   1.336 +    { 0x080c, "fr-BE" }, //French
   1.337 +    { 0x0810, "it-CH" }, //Italian
   1.338 +    { 0x0813, "nl-BE" }, //Dutch
   1.339 +    { 0x0814, "nn-NO" }, //Norwegian (Nynorsk)
   1.340 +    { 0x0816, "pt-PT" }, //Portuguese
   1.341 +    { 0x081a, "sr-Latn-CS" }, //Serbian (Latin)
   1.342 +    { 0x081d, "sv-FI" }, //Swedish
   1.343 +    { 0x082c, "az-Cyrl-AZ" }, //Azeri (Cyrillic)
   1.344 +    { 0x082e, "dsb-DE" }, //Lower Sorbian
   1.345 +    { 0x082e, "dsb" }, //Lower Sorbian
   1.346 +    { 0x083b, "se-SE" }, //Sami (Northern)
   1.347 +    { 0x083c, "ga-IE" }, //Irish
   1.348 +    { 0x083e, "ms-BN" }, //Malay
   1.349 +    { 0x0843, "uz-Cyrl-UZ" }, //Uzbek (Cyrillic)
   1.350 +    { 0x0845, "bn-BD" }, //Bengali
   1.351 +    { 0x0850, "mn-Mong-CN" }, //Mongolian (Traditional Mongolian)
   1.352 +    { 0x085d, "iu-Latn-CA" }, //Inuktitut (Latin)
   1.353 +    { 0x085f, "tzm-Latn-DZ" }, //Tamazight (Latin)
   1.354 +    { 0x086b, "quz-EC" }, //Quechua
   1.355 +    { 0x0c01, "ar-EG" }, //Arabic
   1.356 +    { 0x0c04, "zh-Hant" }, //Chinese (Traditional)
   1.357 +    { 0x0c07, "de-AT" }, //German
   1.358 +    { 0x0c09, "en-AU" }, //English
   1.359 +    { 0x0c0a, "es-ES" }, //Spanish
   1.360 +    { 0x0c0c, "fr-CA" }, //French
   1.361 +    { 0x0c1a, "sr-Cyrl-CS" }, //Serbian (Cyrillic)
   1.362 +    { 0x0c3b, "se-FI" }, //Sami (Northern)
   1.363 +    { 0x0c6b, "quz-PE" }, //Quechua
   1.364 +    { 0x1001, "ar-LY" }, //Arabic
   1.365 +    { 0x1004, "zh-SG" }, //Chinese (Simplified)
   1.366 +    { 0x1007, "de-LU" }, //German
   1.367 +    { 0x1009, "en-CA" }, //English
   1.368 +    { 0x100a, "es-GT" }, //Spanish
   1.369 +    { 0x100c, "fr-CH" }, //French
   1.370 +    { 0x101a, "hr-BA" }, //Croatian (Latin)
   1.371 +    { 0x103b, "smj-NO" }, //Sami (Lule)
   1.372 +    { 0x1401, "ar-DZ" }, //Arabic
   1.373 +    { 0x1404, "zh-MO" }, //Chinese (Traditional)
   1.374 +    { 0x1407, "de-LI" }, //German
   1.375 +    { 0x1409, "en-NZ" }, //English
   1.376 +    { 0x140a, "es-CR" }, //Spanish
   1.377 +    { 0x140c, "fr-LU" }, //French
   1.378 +    { 0x141a, "bs-Latn-BA" }, //Bosnian (Latin)
   1.379 +    { 0x141a, "bs" }, //Bosnian
   1.380 +    { 0x143b, "smj-SE" }, //Sami (Lule)
   1.381 +    { 0x143b, "smj" }, //Sami (Lule)
   1.382 +    { 0x1801, "ar-MA" }, //Arabic
   1.383 +    { 0x1809, "en-IE" }, //English
   1.384 +    { 0x180a, "es-PA" }, //Spanish
   1.385 +    { 0x180c, "fr-MC" }, //French
   1.386 +    { 0x181a, "sr-Latn-BA" }, //Serbian (Latin)
   1.387 +    { 0x183b, "sma-NO" }, //Sami (Southern)
   1.388 +    { 0x1c01, "ar-TN" }, //Arabic
   1.389 +    { 0x1c09, "en-ZA" }, //English
   1.390 +    { 0x1c0a, "es-DO" }, //Spanish
   1.391 +    { 0x1c1a, "sr-Cyrl-BA" }, //Serbian (Cyrillic)
   1.392 +    { 0x1c3b, "sma-SE" }, //Sami (Southern)
   1.393 +    { 0x1c3b, "sma" }, //Sami (Southern)
   1.394 +    { 0x2001, "ar-OM" }, //Arabic
   1.395 +    { 0x2009, "en-JM" }, //English
   1.396 +    { 0x200a, "es-VE" }, //Spanish
   1.397 +    { 0x201a, "bs-Cyrl-BA" }, //Bosnian (Cyrillic)
   1.398 +    { 0x201a, "bs-Cyrl" }, //Bosnian (Cyrillic)
   1.399 +    { 0x203b, "sms-FI" }, //Sami (Skolt)
   1.400 +    { 0x203b, "sms" }, //Sami (Skolt)
   1.401 +    { 0x2401, "ar-YE" }, //Arabic
   1.402 +    { 0x2409, "en-029" }, //English
   1.403 +    { 0x240a, "es-CO" }, //Spanish
   1.404 +    { 0x241a, "sr-Latn-RS" }, //Serbian (Latin)
   1.405 +    { 0x243b, "smn-FI" }, //Sami (Inari)
   1.406 +    { 0x2801, "ar-SY" }, //Arabic
   1.407 +    { 0x2809, "en-BZ" }, //English
   1.408 +    { 0x280a, "es-PE" }, //Spanish
   1.409 +    { 0x281a, "sr-Cyrl-RS" }, //Serbian (Cyrillic)
   1.410 +    { 0x2c01, "ar-JO" }, //Arabic
   1.411 +    { 0x2c09, "en-TT" }, //English
   1.412 +    { 0x2c0a, "es-AR" }, //Spanish
   1.413 +    { 0x2c1a, "sr-Latn-ME" }, //Serbian (Latin)
   1.414 +    { 0x3001, "ar-LB" }, //Arabic
   1.415 +    { 0x3009, "en-ZW" }, //English
   1.416 +    { 0x300a, "es-EC" }, //Spanish
   1.417 +    { 0x301a, "sr-Cyrl-ME" }, //Serbian (Cyrillic)
   1.418 +    { 0x3401, "ar-KW" }, //Arabic
   1.419 +    { 0x3409, "en-PH" }, //English
   1.420 +    { 0x340a, "es-CL" }, //Spanish
   1.421 +    { 0x3801, "ar-AE" }, //Arabic
   1.422 +    { 0x380a, "es-UY" }, //Spanish
   1.423 +    { 0x3c01, "ar-BH" }, //Arabic
   1.424 +    { 0x3c0a, "es-PY" }, //Spanish
   1.425 +    { 0x4001, "ar-QA" }, //Arabic
   1.426 +    { 0x4009, "en-IN" }, //English
   1.427 +    { 0x400a, "es-BO" }, //Spanish
   1.428 +    { 0x4409, "en-MY" }, //English
   1.429 +    { 0x440a, "es-SV" }, //Spanish
   1.430 +    { 0x4809, "en-SG" }, //English
   1.431 +    { 0x480a, "es-HN" }, //Spanish
   1.432 +    { 0x4c0a, "es-NI" }, //Spanish
   1.433 +    { 0x500a, "es-PR" }, //Spanish
   1.434 +    { 0x540a, "es-US" }, //Spanish
   1.435 +};
   1.436 +
   1.437 +namespace {
   1.438 +bool BCP47FromLanguageIdLess(const BCP47FromLanguageId& a, const BCP47FromLanguageId& b) {
   1.439 +    return a.languageID < b.languageID;
   1.440 +}
   1.441 +}
   1.442 +
   1.443 +bool SkOTTableName::Iterator::next(SkOTTableName::Iterator::Record& record) {
   1.444 +    const size_t nameRecordsCount = SkEndian_SwapBE16(fName.count);
   1.445 +    const SkOTTableName::Record* nameRecords = SkTAfter<const SkOTTableName::Record>(&fName);
   1.446 +    const SkOTTableName::Record* nameRecord;
   1.447 +
   1.448 +    // Find the next record which matches the requested type.
   1.449 +    do {
   1.450 +        if (fIndex >= nameRecordsCount) {
   1.451 +            return false;
   1.452 +        }
   1.453 +
   1.454 +        nameRecord = &nameRecords[fIndex];
   1.455 +        ++fIndex;
   1.456 +    } while (fType != -1 && nameRecord->nameID.fontSpecific != fType);
   1.457 +
   1.458 +    record.type = nameRecord->nameID.fontSpecific;
   1.459 +
   1.460 +    const uint16_t stringTableOffset = SkEndian_SwapBE16(fName.stringOffset);
   1.461 +    const char* stringTable = SkTAddOffset<const char>(&fName, stringTableOffset);
   1.462 +
   1.463 +    // Decode the name into UTF-8.
   1.464 +    const uint16_t nameOffset = SkEndian_SwapBE16(nameRecord->offset);
   1.465 +    const uint16_t nameLength = SkEndian_SwapBE16(nameRecord->length);
   1.466 +    const char* nameString = SkTAddOffset<const char>(stringTable, nameOffset);
   1.467 +    switch (nameRecord->platformID.value) {
   1.468 +        case SkOTTableName::Record::PlatformID::Windows:
   1.469 +            if (SkOTTableName::Record::EncodingID::Windows::UnicodeBMPUCS2
   1.470 +                   != nameRecord->encodingID.windows.value
   1.471 +                && SkOTTableName::Record::EncodingID::Windows::UnicodeUCS4
   1.472 +                   != nameRecord->encodingID.windows.value
   1.473 +                && SkOTTableName::Record::EncodingID::Windows::Symbol
   1.474 +                   != nameRecord->encodingID.windows.value)
   1.475 +            {
   1.476 +                record.name.reset();
   1.477 +                break;
   1.478 +            }
   1.479 +        case SkOTTableName::Record::PlatformID::Unicode:
   1.480 +        case SkOTTableName::Record::PlatformID::ISO:
   1.481 +            SkStringFromUTF16BE((const uint16_t*)nameString, nameLength, record.name);
   1.482 +            break;
   1.483 +
   1.484 +        case SkOTTableName::Record::PlatformID::Macintosh:
   1.485 +            // TODO: need better decoding, especially on Mac.
   1.486 +            if (SkOTTableName::Record::EncodingID::Macintosh::Roman
   1.487 +                != nameRecord->encodingID.macintosh.value)
   1.488 +            {
   1.489 +                record.name.reset();
   1.490 +                break;
   1.491 +            }
   1.492 +            SkStringFromMacRoman((const uint8_t*)nameString, nameLength, record.name);
   1.493 +            break;
   1.494 +
   1.495 +        case SkOTTableName::Record::PlatformID::Custom:
   1.496 +            // These should never appear in a 'name' table.
   1.497 +        default:
   1.498 +            SkASSERT(false);
   1.499 +            record.name.reset();
   1.500 +            break;
   1.501 +    }
   1.502 +
   1.503 +    // Determine the language.
   1.504 +    const uint16_t languageID = SkEndian_SwapBE16(nameRecord->languageID.languageTagID);
   1.505 +
   1.506 +    // Handle format 1 languages.
   1.507 +    if (SkOTTableName::format_1 == fName.format && languageID >= 0x8000) {
   1.508 +        const uint16_t languageTagRecordIndex = languageID - 0x8000;
   1.509 +
   1.510 +        const SkOTTableName::Format1Ext* format1ext =
   1.511 +            SkTAfter<const SkOTTableName::Format1Ext>(nameRecords, nameRecordsCount);
   1.512 +
   1.513 +        if (languageTagRecordIndex < SkEndian_SwapBE16(format1ext->langTagCount)) {
   1.514 +            const SkOTTableName::Format1Ext::LangTagRecord* languageTagRecord =
   1.515 +                SkTAfter<const SkOTTableName::Format1Ext::LangTagRecord>(format1ext);
   1.516 +
   1.517 +            uint16_t offset = SkEndian_SwapBE16(languageTagRecord[languageTagRecordIndex].offset);
   1.518 +            uint16_t length = SkEndian_SwapBE16(languageTagRecord[languageTagRecordIndex].length);
   1.519 +            const uint16_t* string = SkTAddOffset<const uint16_t>(stringTable, offset);
   1.520 +            SkStringFromUTF16BE(string, length, record.language);
   1.521 +            return true;
   1.522 +        }
   1.523 +    }
   1.524 +
   1.525 +    // Handle format 0 languages, translating them into BCP 47.
   1.526 +    const BCP47FromLanguageId target = { languageID, "" };
   1.527 +    int languageIndex = SkTSearch<BCP47FromLanguageId, BCP47FromLanguageIdLess>(
   1.528 +        BCP47FromLanguageID, SK_ARRAY_COUNT(BCP47FromLanguageID), target, sizeof(target));
   1.529 +    if (languageIndex >= 0) {
   1.530 +        record.language = BCP47FromLanguageID[languageIndex].bcp47;
   1.531 +        return true;
   1.532 +    }
   1.533 +
   1.534 +    // Unknown language, return the BCP 47 code 'und' for 'undetermined'.
   1.535 +    record.language = "und";
   1.536 +    return true;
   1.537 +}

mercurial