diff options
author | Edward Welbourne <edward.welbourne@qt.io> | 2020-10-08 16:00:36 +0200 |
---|---|---|
committer | Edward Welbourne <edward.welbourne@qt.io> | 2020-11-08 13:01:18 +0100 |
commit | 4ab6358039309b7a3610db5f960d5311e8c57627 (patch) | |
tree | 771a453d95bbf9eb740ba392f81d5b5fa934cb5c /util | |
parent | 73ceb715767ea43d9243f1888661d835cf3c33e9 (diff) |
Reorder locale enums alphabetically
Binary-incompatible change: change the numeric values of QLocale's
Language, Script and Country enums, as encouraged by a comment in the
generator script enumdata.py, and clarify the documentation around that.
In the process (since I was changing almost every line anyway),
convert the dictionary values from (mutable) lists of length two to
tuples, since they are (and should be) immutable data.
Change-Id: I26222bce45b9f5074b1d81ed70015a75ac34adcd
Reviewed-by: Mårten Nordheim <marten.nordheim@qt.io>
Diffstat (limited to 'util')
-rwxr-xr-x | util/locale_database/cldr2qtimezone.py | 2 | ||||
-rw-r--r-- | util/locale_database/enumdata.py | 1473 |
2 files changed, 741 insertions, 734 deletions
diff --git a/util/locale_database/cldr2qtimezone.py b/util/locale_database/cldr2qtimezone.py index 4695c0d162..98076e2ec1 100755 --- a/util/locale_database/cldr2qtimezone.py +++ b/util/locale_database/cldr2qtimezone.py @@ -324,7 +324,7 @@ class ZoneIdWriter (SourceFileEditor): return windowsIdData, ianaIdData def usage(err, name, message=''): - err.write("""Usage: {} path/to/cldr/core/common path/to/qtbase + err.write("""Usage: {} path/to/cldr/root path/to/qtbase """.format(name)) # TODO: more interesting message if message: err.write('\n' + message + '\n') diff --git a/util/locale_database/enumdata.py b/util/locale_database/enumdata.py index f4216bee8a..f20ac974ee 100644 --- a/util/locale_database/enumdata.py +++ b/util/locale_database/enumdata.py @@ -41,337 +41,342 @@ # shall squish them out for the enum entries) in *_list, but use the # squished forms of names in the *_aliases mappings. -### Qt 6: restore alphabetic order in each list. +# For a new major version (and only then), we can change the +# numbering, so re-sort each list into alphabetic order (e.g. using +# sort -k2); but keep the Any and C entries first. That's why those +# are offset with a blank line, below. After doing that, regenerate +# locale data as usual; this will cause a binary-incompatible change. 
language_list = { - 0: ["AnyLanguage", " "], - 1: ["C", " "], - 2: ["Abkhazian", "ab"], - 3: ["Oromo", "om"], # macrolanguage - 4: ["Afar", "aa"], - 5: ["Afrikaans", "af"], - 6: ["Albanian", "sq"], # macrolanguage - 7: ["Amharic", "am"], - 8: ["Arabic", "ar"], # macrolanguage - 9: ["Armenian", "hy"], - 10: ["Assamese", "as"], - 11: ["Aymara", "ay"], # macrolanguage - 12: ["Azerbaijani", "az"], # macrolanguage - 13: ["Bashkir", "ba"], - 14: ["Basque", "eu"], - 15: ["Bangla", "bn"], - 16: ["Dzongkha", "dz"], - 18: ["Bislama", "bi"], - 19: ["Breton", "br"], - 20: ["Bulgarian", "bg"], - 21: ["Burmese", "my"], - 22: ["Belarusian", "be"], - 23: ["Khmer", "km"], - 24: ["Catalan", "ca"], - 25: ["Chinese", "zh"], # macrolanguage - 26: ["Corsican", "co"], - 27: ["Croatian", "hr"], - 28: ["Czech", "cs"], - 29: ["Danish", "da"], - 30: ["Dutch", "nl"], - 31: ["English", "en"], - 32: ["Esperanto", "eo"], - 33: ["Estonian", "et"], # macrolanguage - 34: ["Faroese", "fo"], - 35: ["Fijian", "fj"], - 36: ["Finnish", "fi"], - 37: ["French", "fr"], - 38: ["Western Frisian", "fy"], - 39: ["Gaelic", "gd"], - 40: ["Galician", "gl"], - 41: ["Georgian", "ka"], - 42: ["German", "de"], - 43: ["Greek", "el"], - 44: ["Kalaallisut", "kl"], - 45: ["Guarani", "gn"], # macrolanguage - 46: ["Gujarati", "gu"], - 47: ["Hausa", "ha"], - 48: ["Hebrew", "he"], - 49: ["Hindi", "hi"], - 50: ["Hungarian", "hu"], - 51: ["Icelandic", "is"], - 52: ["Indonesian", "id"], - 53: ["Interlingua", "ia"], - 54: ["Interlingue", "ie"], - 55: ["Inuktitut", "iu"], # macrolanguage - 56: ["Inupiaq", "ik"], # macrolanguage - 57: ["Irish", "ga"], - 58: ["Italian", "it"], - 59: ["Japanese", "ja"], - 60: ["Javanese", "jv"], - 61: ["Kannada", "kn"], - 62: ["Kashmiri", "ks"], - 63: ["Kazakh", "kk"], - 64: ["Kinyarwanda", "rw"], - 65: ["Kyrgyz", "ky"], - 66: ["Korean", "ko"], - 67: ["Kurdish", "ku"], # macrolanguage - 68: ["Rundi", "rn"], - 69: ["Lao", "lo"], - 70: ["Latin", "la"], - 71: ["Latvian", "lv"], # macrolanguage - 72: 
["Lingala", "ln"], - 73: ["Lithuanian", "lt"], - 74: ["Macedonian", "mk"], - 75: ["Malagasy", "mg"], # macrolanguage - 76: ["Malay", "ms"], # macrolanguage - 77: ["Malayalam", "ml"], - 78: ["Maltese", "mt"], - 79: ["Maori", "mi"], - 80: ["Marathi", "mr"], - 81: ["Marshallese", "mh"], - 82: ["Mongolian", "mn"], # macrolanguage - 83: ["Nauru", "na"], - 84: ["Nepali", "ne"], # macrolanguage - 85: ["Norwegian Bokmal", "nb"], - 86: ["Occitan", "oc"], - 87: ["Odia", "or"], # macrolanguage - 88: ["Pashto", "ps"], # macrolanguage - 89: ["Persian", "fa"], # macrolanguage - 90: ["Polish", "pl"], - 91: ["Portuguese", "pt"], - 92: ["Punjabi", "pa"], - 93: ["Quechua", "qu"], # macrolanguage - 94: ["Romansh", "rm"], - 95: ["Romanian", "ro"], - 96: ["Russian", "ru"], - 97: ["Samoan", "sm"], - 98: ["Sango", "sg"], - 99: ["Sanskrit", "sa"], - 100: ["Serbian", "sr"], - 101: ["Ossetic", "os"], - 102: ["Southern Sotho", "st"], - 103: ["Tswana", "tn"], - 104: ["Shona", "sn"], - 105: ["Sindhi", "sd"], - 106: ["Sinhala", "si"], - 107: ["Swati", "ss"], - 108: ["Slovak", "sk"], - 109: ["Slovenian", "sl"], - 110: ["Somali", "so"], - 111: ["Spanish", "es"], - 112: ["Sundanese", "su"], - 113: ["Swahili", "sw"], # macrolanguage - 114: ["Swedish", "sv"], - 115: ["Sardinian", "sc"], # macrolanguage - 116: ["Tajik", "tg"], - 117: ["Tamil", "ta"], - 118: ["Tatar", "tt"], - 119: ["Telugu", "te"], - 120: ["Thai", "th"], - 121: ["Tibetan", "bo"], - 122: ["Tigrinya", "ti"], - 123: ["Tongan", "to"], - 124: ["Tsonga", "ts"], - 125: ["Turkish", "tr"], - 126: ["Turkmen", "tk"], - 127: ["Tahitian", "ty"], - 128: ["Uyghur", "ug"], - 129: ["Ukrainian", "uk"], - 130: ["Urdu", "ur"], - 131: ["Uzbek", "uz"], # macrolanguage - 132: ["Vietnamese", "vi"], - 133: ["Volapuk", "vo"], - 134: ["Welsh", "cy"], - 135: ["Wolof", "wo"], - 136: ["Xhosa", "xh"], - 137: ["Yiddish", "yi"], # macrolanguage - 138: ["Yoruba", "yo"], - 139: ["Zhuang", "za"], # macrolanguage - 140: ["Zulu", "zu"], - 141: ["Norwegian Nynorsk", 
"nn"], - 142: ["Bosnian", "bs"], - 143: ["Divehi", "dv"], - 144: ["Manx", "gv"], - 145: ["Cornish", "kw"], - 146: ["Akan", "ak"], # macrolanguage - 147: ["Konkani", "kok"], - 148: ["Ga", "gaa"], - 149: ["Igbo", "ig" ], - 150: ["Kamba", "kam"], - 151: ["Syriac", "syr"], - 152: ["Blin", "byn"], - 153: ["Geez", "gez"], - 154: ["Koro", "kfo"], - 155: ["Sidamo", "sid"], - 156: ["Atsam", "cch"], - 157: ["Tigre", "tig"], - 158: ["Jju", "kaj"], - 159: ["Friulian", "fur"], - 160: ["Venda", "ve" ], - 161: ["Ewe", "ee" ], - 162: ["Wolaytta", "wal"], - 163: ["Hawaiian", "haw"], - 164: ["Tyap", "kcg"], - 165: ["Nyanja", "ny" ], - 166: ["Filipino", "fil"], - 167: ["Swiss German", "gsw"], - 168: ["Sichuan Yi", "ii" ], - 169: ["Kpelle", "kpe"], - 170: ["Low German", "nds"], - 171: ["South Ndebele", "nr" ], - 172: ["Northern Sotho", "nso"], - 173: ["Northern Sami", "se" ], - 174: ["Taroko", "trv"], - 175: ["Gusii", "guz"], - 176: ["Taita", "dav"], - 177: ["Fulah", "ff"], # macrolanguage - 178: ["Kikuyu", "ki"], - 179: ["Samburu", "saq"], - 180: ["Sena", "seh"], - 181: ["North Ndebele", "nd"], - 182: ["Rombo", "rof"], - 183: ["Tachelhit", "shi"], - 184: ["Kabyle", "kab"], - 185: ["Nyankole", "nyn"], - 186: ["Bena", "bez"], - 187: ["Vunjo", "vun"], - 188: ["Bambara", "bm"], - 189: ["Embu", "ebu"], - 190: ["Cherokee", "chr"], - 191: ["Morisyen", "mfe"], - 192: ["Makonde", "kde"], - 193: ["Langi", "lag"], - 194: ["Ganda", "lg"], - 195: ["Bemba", "bem"], - 196: ["Kabuverdianu", "kea"], - 197: ["Meru", "mer"], - 198: ["Kalenjin", "kln"], - 199: ["Nama", "naq"], - 200: ["Machame", "jmc"], - 201: ["Colognian", "ksh"], - 202: ["Masai", "mas"], - 203: ["Soga", "xog"], - 204: ["Luyia", "luy"], - 205: ["Asu", "asa"], - 206: ["Teso", "teo"], - 207: ["Saho", "ssy"], - 208: ["Koyra Chiini", "khq"], - 209: ["Rwa", "rwk"], - 210: ["Luo", "luo"], - 211: ["Chiga", "cgg"], - 212: ["Central Atlas Tamazight", "tzm"], - 213: ["Koyraboro Senni", "ses"], - 214: ["Shambala", "ksb"], - 215: ["Bodo", "brx"], 
- 216: ["Avaric", "av"], - 217: ["Chamorro", "ch"], - 218: ["Chechen", "ce"], - 219: ["Church", "cu"], # macrolanguage - 220: ["Chuvash", "cv"], - 221: ["Cree", "cr"], # macrolanguage - 222: ["Haitian", "ht"], - 223: ["Herero", "hz"], - 224: ["Hiri Motu", "ho"], - 225: ["Kanuri", "kr"], # macrolanguage - 226: ["Komi", "kv"], # macrolanguage - 227: ["Kongo", "kg"], # macrolanguage - 228: ["Kuanyama", "kj"], - 229: ["Limburgish", "li"], - 230: ["Luba Katanga", "lu"], - 231: ["Luxembourgish", "lb"], - 232: ["Navajo", "nv"], - 233: ["Ndonga", "ng"], - 234: ["Ojibwa", "oj"], # macrolanguage - 235: ["Pali", "pi"], # macrolanguage - 236: ["Walloon", "wa"], - 237: ["Aghem", "agq"], - 238: ["Basaa", "bas"], - 239: ["Zarma", "dje"], - 240: ["Duala", "dua"], - 241: ["Jola Fonyi", "dyo"], - 242: ["Ewondo", "ewo"], - 243: ["Bafia", "ksf"], - 244: ["Makhuwa Meetto", "mgh"], - 245: ["Mundang", "mua"], - 246: ["Kwasio", "nmg"], - 247: ["Nuer", "nus"], - 248: ["Sakha", "sah"], - 249: ["Sangu", "sbp"], - 251: ["Tasawaq", "twq"], - 252: ["Vai", "vai"], - 253: ["Walser", "wae"], - 254: ["Yangben", "yav"], - 255: ["Avestan", "ae"], - 256: ["Asturian", "ast"], - 257: ["Ngomba", "jgo"], - 258: ["Kako", "kkj"], - 259: ["Meta", "mgo"], - 260: ["Ngiemboon", "nnh"], - 261: ["Aragonese", "an"], - 262: ["Akkadian", "akk"], - 263: ["Ancient Egyptian", "egy"], - 264: ["Ancient Greek", "grc"], - 265: ["Aramaic", "arc"], - 266: ["Balinese", "ban"], - 267: ["Bamun", "bax"], - 268: ["Batak Toba", "bbc"], - 269: ["Buginese", "bug"], - 272: ["Chakma", "ccp"], - 274: ["Coptic", "cop"], - 275: ["Dogri", "doi"], # macrolanguage - 279: ["Gothic", "got"], - 281: ["Ingush", "inh"], - 289: ["Mandingo", "man"], # macrolanguage - 290: ["Manipuri", "mni"], - 293: ["Old Irish", "sga"], - 294: ["Old Norse", "non"], - 295: ["Old Persian", "peo"], - 297: ["Pahlavi", "pal"], - 299: ["Phoenician", "phn"], - 304: ["Santali", "sat"], - 305: ["Saurashtra", "saz"], - 309: ["Tai Dam", "blt"], - 311: ["Ugaritic", "uga"], - 
312: ["Akoose", "bss"], - 313: ["Lakota", "lkt"], - 314: ["Standard Moroccan Tamazight", "zgh"], - 315: ["Mapuche", "arn"], - 316: ["Central Kurdish", "ckb"], - 317: ["Lower Sorbian", "dsb"], - 318: ["Upper Sorbian", "hsb"], - 319: ["Kenyang", "ken"], - 320: ["Mohawk", "moh"], - 321: ["Nko", "nqo"], - 322: ["Prussian", "prg"], - 323: ["Kiche", "quc"], - 324: ["Southern Sami", "sma"], - 325: ["Lule Sami", "smj"], - 326: ["Inari Sami", "smn"], - 327: ["Skolt Sami", "sms"], - 328: ["Warlpiri", "wbp"], - 330: ["Mende", "men"], - 335: ["Lezghian", "lez"], - 339: ["Maithili", "mai"], - 341: ["American Sign Language", "ase"], - 343: ["Bhojpuri", "bho"], - 345: ["Literary Chinese", "lzh"], - 346: ["Mazanderani", "mzn"], - 348: ["Newari", "new"], - 349: ["Northern Luri", "lrc"], - 350: ["Palauan", "pau"], - 351: ["Papiamento", "pap"], - 353: ["Tokelau", "tkl"], - 354: ["Tok Pisin", "tpi"], - 355: ["Tuvalu", "tvl"], - 357: ["Cantonese", "yue"], - 358: ["Osage", "osa"], - 360: ["Ido", "io"], - 361: ["Lojban", "jbo"], - 362: ["Sicilian", "scn"], - 363: ["Southern Kurdish", "sdh"], - 364: ["Western Balochi", "bgn"], - 365: ["Cebuano", "ceb"], - 366: ["Erzya", "myv"], - 367: ["Chickasaw", "cic"], - 368: ["Muscogee", "mus"], - 369: ["Silesian", "szl"], - 370: ["Nigerian Pidgin", "pcm"], + 0: ("AnyLanguage", " "), + 1: ("C", " "), + + 2: ("Abkhazian", "ab"), + 3: ("Afar", "aa"), + 4: ("Afrikaans", "af"), + 5: ("Aghem", "agq"), + 6: ("Akan", "ak"), # macrolanguage + 7: ("Akkadian", "akk"), + 8: ("Akoose", "bss"), + 9: ("Albanian", "sq"), # macrolanguage + 10: ("American Sign Language", "ase"), + 11: ("Amharic", "am"), + 12: ("Ancient Egyptian", "egy"), + 13: ("Ancient Greek", "grc"), + 14: ("Arabic", "ar"), # macrolanguage + 15: ("Aragonese", "an"), + 16: ("Aramaic", "arc"), + 17: ("Armenian", "hy"), + 18: ("Assamese", "as"), + 19: ("Asturian", "ast"), + 20: ("Asu", "asa"), + 21: ("Atsam", "cch"), + 22: ("Avaric", "av"), + 23: ("Avestan", "ae"), + 24: ("Aymara", "ay"), # 
macrolanguage + 25: ("Azerbaijani", "az"), # macrolanguage + 26: ("Bafia", "ksf"), + 27: ("Balinese", "ban"), + 28: ("Bambara", "bm"), + 29: ("Bamun", "bax"), + 30: ("Bangla", "bn"), + 31: ("Basaa", "bas"), + 32: ("Bashkir", "ba"), + 33: ("Basque", "eu"), + 34: ("Batak Toba", "bbc"), + 35: ("Belarusian", "be"), + 36: ("Bemba", "bem"), + 37: ("Bena", "bez"), + 38: ("Bhojpuri", "bho"), + 39: ("Bislama", "bi"), + 40: ("Blin", "byn"), + 41: ("Bodo", "brx"), + 42: ("Bosnian", "bs"), + 43: ("Breton", "br"), + 44: ("Buginese", "bug"), + 45: ("Bulgarian", "bg"), + 46: ("Burmese", "my"), + 47: ("Cantonese", "yue"), + 48: ("Catalan", "ca"), + 49: ("Cebuano", "ceb"), + 50: ("Central Atlas Tamazight", "tzm"), + 51: ("Central Kurdish", "ckb"), + 52: ("Chakma", "ccp"), + 53: ("Chamorro", "ch"), + 54: ("Chechen", "ce"), + 55: ("Cherokee", "chr"), + 56: ("Chickasaw", "cic"), + 57: ("Chiga", "cgg"), + 58: ("Chinese", "zh"), # macrolanguage + 59: ("Church", "cu"), # macrolanguage + 60: ("Chuvash", "cv"), + 61: ("Colognian", "ksh"), + 62: ("Coptic", "cop"), + 63: ("Cornish", "kw"), + 64: ("Corsican", "co"), + 65: ("Cree", "cr"), # macrolanguage + 66: ("Croatian", "hr"), + 67: ("Czech", "cs"), + 68: ("Danish", "da"), + 69: ("Divehi", "dv"), + 70: ("Dogri", "doi"), # macrolanguage + 71: ("Duala", "dua"), + 72: ("Dutch", "nl"), + 73: ("Dzongkha", "dz"), + 74: ("Embu", "ebu"), + 75: ("English", "en"), + 76: ("Erzya", "myv"), + 77: ("Esperanto", "eo"), + 78: ("Estonian", "et"), # macrolanguage + 79: ("Ewe", "ee" ), + 80: ("Ewondo", "ewo"), + 81: ("Faroese", "fo"), + 82: ("Fijian", "fj"), + 83: ("Filipino", "fil"), + 84: ("Finnish", "fi"), + 85: ("French", "fr"), + 86: ("Friulian", "fur"), + 87: ("Fulah", "ff"), # macrolanguage + 88: ("Gaelic", "gd"), + 89: ("Ga", "gaa"), + 90: ("Galician", "gl"), + 91: ("Ganda", "lg"), + 92: ("Geez", "gez"), + 93: ("Georgian", "ka"), + 94: ("German", "de"), + 95: ("Gothic", "got"), + 96: ("Greek", "el"), + 97: ("Guarani", "gn"), # macrolanguage + 98: 
("Gujarati", "gu"), + 99: ("Gusii", "guz"), + 100: ("Haitian", "ht"), + 101: ("Hausa", "ha"), + 102: ("Hawaiian", "haw"), + 103: ("Hebrew", "he"), + 104: ("Herero", "hz"), + 105: ("Hindi", "hi"), + 106: ("Hiri Motu", "ho"), + 107: ("Hungarian", "hu"), + 108: ("Icelandic", "is"), + 109: ("Ido", "io"), + 110: ("Igbo", "ig" ), + 111: ("Inari Sami", "smn"), + 112: ("Indonesian", "id"), + 113: ("Ingush", "inh"), + 114: ("Interlingua", "ia"), + 115: ("Interlingue", "ie"), + 116: ("Inuktitut", "iu"), # macrolanguage + 117: ("Inupiaq", "ik"), # macrolanguage + 118: ("Irish", "ga"), + 119: ("Italian", "it"), + 120: ("Japanese", "ja"), + 121: ("Javanese", "jv"), + 122: ("Jju", "kaj"), + 123: ("Jola Fonyi", "dyo"), + 124: ("Kabuverdianu", "kea"), + 125: ("Kabyle", "kab"), + 126: ("Kako", "kkj"), + 127: ("Kalaallisut", "kl"), + 128: ("Kalenjin", "kln"), + 129: ("Kamba", "kam"), + 130: ("Kannada", "kn"), + 131: ("Kanuri", "kr"), # macrolanguage + 132: ("Kashmiri", "ks"), + 133: ("Kazakh", "kk"), + 134: ("Kenyang", "ken"), + 135: ("Khmer", "km"), + 136: ("Kiche", "quc"), + 137: ("Kikuyu", "ki"), + 138: ("Kinyarwanda", "rw"), + 139: ("Komi", "kv"), # macrolanguage + 140: ("Kongo", "kg"), # macrolanguage + 141: ("Konkani", "kok"), + 142: ("Korean", "ko"), + 143: ("Koro", "kfo"), + 144: ("Koyraboro Senni", "ses"), + 145: ("Koyra Chiini", "khq"), + 146: ("Kpelle", "kpe"), + 147: ("Kuanyama", "kj"), + 148: ("Kurdish", "ku"), # macrolanguage + 149: ("Kwasio", "nmg"), + 150: ("Kyrgyz", "ky"), + 151: ("Lakota", "lkt"), + 152: ("Langi", "lag"), + 153: ("Lao", "lo"), + 154: ("Latin", "la"), + 155: ("Latvian", "lv"), # macrolanguage + 156: ("Lezghian", "lez"), + 157: ("Limburgish", "li"), + 158: ("Lingala", "ln"), + 159: ("Literary Chinese", "lzh"), + 160: ("Lithuanian", "lt"), + 161: ("Lojban", "jbo"), + 162: ("Lower Sorbian", "dsb"), + 163: ("Low German", "nds"), + 164: ("Luba Katanga", "lu"), + 165: ("Lule Sami", "smj"), + 166: ("Luo", "luo"), + 167: ("Luxembourgish", "lb"), + 168: 
("Luyia", "luy"), + 169: ("Macedonian", "mk"), + 170: ("Machame", "jmc"), + 171: ("Maithili", "mai"), + 172: ("Makhuwa Meetto", "mgh"), + 173: ("Makonde", "kde"), + 174: ("Malagasy", "mg"), # macrolanguage + 175: ("Malayalam", "ml"), + 176: ("Malay", "ms"), # macrolanguage + 177: ("Maltese", "mt"), + 178: ("Mandingo", "man"), # macrolanguage + 179: ("Manipuri", "mni"), + 180: ("Manx", "gv"), + 181: ("Maori", "mi"), + 182: ("Mapuche", "arn"), + 183: ("Marathi", "mr"), + 184: ("Marshallese", "mh"), + 185: ("Masai", "mas"), + 186: ("Mazanderani", "mzn"), + 187: ("Mende", "men"), + 188: ("Meru", "mer"), + 189: ("Meta", "mgo"), + 190: ("Mohawk", "moh"), + 191: ("Mongolian", "mn"), # macrolanguage + 192: ("Morisyen", "mfe"), + 193: ("Mundang", "mua"), + 194: ("Muscogee", "mus"), + 195: ("Nama", "naq"), + 196: ("Nauru", "na"), + 197: ("Navajo", "nv"), + 198: ("Ndonga", "ng"), + 199: ("Nepali", "ne"), # macrolanguage + 200: ("Newari", "new"), + 201: ("Ngiemboon", "nnh"), + 202: ("Ngomba", "jgo"), + 203: ("Nigerian Pidgin", "pcm"), + 204: ("Nko", "nqo"), + 205: ("Northern Luri", "lrc"), + 206: ("Northern Sami", "se" ), + 207: ("Northern Sotho", "nso"), + 208: ("North Ndebele", "nd"), + 209: ("Norwegian Bokmal", "nb"), + 210: ("Norwegian Nynorsk", "nn"), + 211: ("Nuer", "nus"), + 212: ("Nyanja", "ny" ), + 213: ("Nyankole", "nyn"), + 214: ("Occitan", "oc"), + 215: ("Odia", "or"), # macrolanguage + 216: ("Ojibwa", "oj"), # macrolanguage + 217: ("Old Irish", "sga"), + 218: ("Old Norse", "non"), + 219: ("Old Persian", "peo"), + 220: ("Oromo", "om"), # macrolanguage + 221: ("Osage", "osa"), + 222: ("Ossetic", "os"), + 223: ("Pahlavi", "pal"), + 224: ("Palauan", "pau"), + 225: ("Pali", "pi"), # macrolanguage + 226: ("Papiamento", "pap"), + 227: ("Pashto", "ps"), # macrolanguage + 228: ("Persian", "fa"), # macrolanguage + 229: ("Phoenician", "phn"), + 230: ("Polish", "pl"), + 231: ("Portuguese", "pt"), + 232: ("Prussian", "prg"), + 233: ("Punjabi", "pa"), + 234: ("Quechua", "qu"), 
# macrolanguage + 235: ("Romanian", "ro"), + 236: ("Romansh", "rm"), + 237: ("Rombo", "rof"), + 238: ("Rundi", "rn"), + 239: ("Russian", "ru"), + 240: ("Rwa", "rwk"), + 241: ("Saho", "ssy"), + 242: ("Sakha", "sah"), + 243: ("Samburu", "saq"), + 244: ("Samoan", "sm"), + 245: ("Sango", "sg"), + 246: ("Sangu", "sbp"), + 247: ("Sanskrit", "sa"), + 248: ("Santali", "sat"), + 249: ("Sardinian", "sc"), # macrolanguage + 250: ("Saurashtra", "saz"), + 251: ("Sena", "seh"), + 252: ("Serbian", "sr"), + 253: ("Shambala", "ksb"), + 254: ("Shona", "sn"), + 255: ("Sichuan Yi", "ii" ), + 256: ("Sicilian", "scn"), + 257: ("Sidamo", "sid"), + 258: ("Silesian", "szl"), + 259: ("Sindhi", "sd"), + 260: ("Sinhala", "si"), + 261: ("Skolt Sami", "sms"), + 262: ("Slovak", "sk"), + 263: ("Slovenian", "sl"), + 264: ("Soga", "xog"), + 265: ("Somali", "so"), + 266: ("Southern Kurdish", "sdh"), + 267: ("Southern Sami", "sma"), + 268: ("Southern Sotho", "st"), + 269: ("South Ndebele", "nr" ), + 270: ("Spanish", "es"), + 271: ("Standard Moroccan Tamazight", "zgh"), + 272: ("Sundanese", "su"), + 273: ("Swahili", "sw"), # macrolanguage + 274: ("Swati", "ss"), + 275: ("Swedish", "sv"), + 276: ("Swiss German", "gsw"), + 277: ("Syriac", "syr"), + 278: ("Tachelhit", "shi"), + 279: ("Tahitian", "ty"), + 280: ("Tai Dam", "blt"), + 281: ("Taita", "dav"), + 282: ("Tajik", "tg"), + 283: ("Tamil", "ta"), + 284: ("Taroko", "trv"), + 285: ("Tasawaq", "twq"), + 286: ("Tatar", "tt"), + 287: ("Telugu", "te"), + 288: ("Teso", "teo"), + 289: ("Thai", "th"), + 290: ("Tibetan", "bo"), + 291: ("Tigre", "tig"), + 292: ("Tigrinya", "ti"), + 293: ("Tokelau", "tkl"), + 294: ("Tok Pisin", "tpi"), + 295: ("Tongan", "to"), + 296: ("Tsonga", "ts"), + 297: ("Tswana", "tn"), + 298: ("Turkish", "tr"), + 299: ("Turkmen", "tk"), + 300: ("Tuvalu", "tvl"), + 301: ("Tyap", "kcg"), + 302: ("Ugaritic", "uga"), + 303: ("Ukrainian", "uk"), + 304: ("Upper Sorbian", "hsb"), + 305: ("Urdu", "ur"), + 306: ("Uyghur", "ug"), + 307: ("Uzbek", 
"uz"), # macrolanguage + 308: ("Vai", "vai"), + 309: ("Venda", "ve" ), + 310: ("Vietnamese", "vi"), + 311: ("Volapuk", "vo"), + 312: ("Vunjo", "vun"), + 313: ("Walloon", "wa"), + 314: ("Walser", "wae"), + 315: ("Warlpiri", "wbp"), + 316: ("Welsh", "cy"), + 317: ("Western Balochi", "bgn"), + 318: ("Western Frisian", "fy"), + 319: ("Wolaytta", "wal"), + 320: ("Wolof", "wo"), + 321: ("Xhosa", "xh"), + 322: ("Yangben", "yav"), + 323: ("Yiddish", "yi"), # macrolanguage + 324: ("Yoruba", "yo"), + 325: ("Zarma", "dje"), + 326: ("Zhuang", "za"), # macrolanguage + 327: ("Zulu", "zu"), } language_aliases = { @@ -399,271 +404,272 @@ language_aliases = { } country_list = { - 0: ["AnyCountry", "ZZ"], - 1: ["Afghanistan", "AF"], - 2: ["Albania", "AL"], - 3: ["Algeria", "DZ"], - 4: ["American Samoa", "AS"], - 5: ["Andorra", "AD"], - 6: ["Angola", "AO"], - 7: ["Anguilla", "AI"], - 8: ["Antarctica", "AQ"], - 9: ["Antigua And Barbuda", "AG"], - 10: ["Argentina", "AR"], - 11: ["Armenia", "AM"], - 12: ["Aruba", "AW"], - 13: ["Australia", "AU"], - 14: ["Austria", "AT"], - 15: ["Azerbaijan", "AZ"], - 16: ["Bahamas", "BS"], - 17: ["Bahrain", "BH"], - 18: ["Bangladesh", "BD"], - 19: ["Barbados", "BB"], - 20: ["Belarus", "BY"], - 21: ["Belgium", "BE"], - 22: ["Belize", "BZ"], - 23: ["Benin", "BJ"], - 24: ["Bermuda", "BM"], - 25: ["Bhutan", "BT"], - 26: ["Bolivia", "BO"], - 27: ["Bosnia And Herzegovina", "BA"], - 28: ["Botswana", "BW"], - 29: ["Bouvet Island", "BV"], - 30: ["Brazil", "BR"], - 31: ["British Indian Ocean Territory", "IO"], - 32: ["Brunei", "BN"], - 33: ["Bulgaria", "BG"], - 34: ["Burkina Faso", "BF"], - 35: ["Burundi", "BI"], - 36: ["Cambodia", "KH"], - 37: ["Cameroon", "CM"], - 38: ["Canada", "CA"], - 39: ["Cape Verde", "CV"], - 40: ["Cayman Islands", "KY"], - 41: ["Central African Republic", "CF"], - 42: ["Chad", "TD"], - 43: ["Chile", "CL"], - 44: ["China", "CN"], - 45: ["Christmas Island", "CX"], - 46: ["Cocos Islands", "CC"], - 47: ["Colombia", "CO"], - 48: ["Comoros", 
"KM"], - 49: ["Congo Kinshasa", "CD"], - 50: ["Congo Brazzaville", "CG"], - 51: ["Cook Islands", "CK"], - 52: ["Costa Rica", "CR"], + 0: ("AnyCountry", "ZZ"), + + 1: ("Afghanistan", "AF"), + 2: ("Aland Islands", "AX"), + 3: ("Albania", "AL"), + 4: ("Algeria", "DZ"), + 5: ("American Samoa", "AS"), + 6: ("Andorra", "AD"), + 7: ("Angola", "AO"), + 8: ("Anguilla", "AI"), + 9: ("Antarctica", "AQ"), + 10: ("Antigua And Barbuda", "AG"), + 11: ("Argentina", "AR"), + 12: ("Armenia", "AM"), + 13: ("Aruba", "AW"), + 14: ("Ascension Island", "AC"), + 15: ("Australia", "AU"), + 16: ("Austria", "AT"), + 17: ("Azerbaijan", "AZ"), + 18: ("Bahamas", "BS"), + 19: ("Bahrain", "BH"), + 20: ("Bangladesh", "BD"), + 21: ("Barbados", "BB"), + 22: ("Belarus", "BY"), + 23: ("Belgium", "BE"), + 24: ("Belize", "BZ"), + 25: ("Benin", "BJ"), + 26: ("Bermuda", "BM"), + 27: ("Bhutan", "BT"), + 28: ("Bolivia", "BO"), + 29: ("Bosnia And Herzegovina", "BA"), + 30: ("Botswana", "BW"), + 31: ("Bouvet Island", "BV"), + 32: ("Brazil", "BR"), + 33: ("British Indian Ocean Territory", "IO"), + 34: ("British Virgin Islands", "VG"), + 35: ("Brunei", "BN"), + 36: ("Bulgaria", "BG"), + 37: ("Burkina Faso", "BF"), + 38: ("Burundi", "BI"), + 39: ("Cambodia", "KH"), + 40: ("Cameroon", "CM"), + 41: ("Canada", "CA"), + 42: ("Canary Islands", "IC"), + 43: ("Cape Verde", "CV"), + 44: ("Caribbean Netherlands", "BQ"), + 45: ("Cayman Islands", "KY"), + 46: ("Central African Republic", "CF"), + 47: ("Ceuta And Melilla", "EA"), + 48: ("Chad", "TD"), + 49: ("Chile", "CL"), + 50: ("China", "CN"), + 51: ("Christmas Island", "CX"), + 52: ("Clipperton Island", "CP"), + 53: ("Cocos Islands", "CC"), + 54: ("Colombia", "CO"), + 55: ("Comoros", "KM"), + 56: ("Congo Brazzaville", "CG"), + 57: ("Congo Kinshasa", "CD"), + 58: ("Cook Islands", "CK"), + 59: ("Costa Rica", "CR"), + 60: ("Croatia", "HR"), + 61: ("Cuba", "CU"), + 62: ("Curacao", "CW"), + 63: ("Cyprus", "CY"), + 64: ("Czechia", "CZ"), + 65: ("Denmark", "DK"), + 66: ("Diego 
Garcia", "DG"), + 67: ("Djibouti", "DJ"), + 68: ("Dominica", "DM"), + 69: ("Dominican Republic", "DO"), + 70: ("Ecuador", "EC"), + 71: ("Egypt", "EG"), + 72: ("El Salvador", "SV"), + 73: ("Equatorial Guinea", "GQ"), + 74: ("Eritrea", "ER"), + 75: ("Estonia", "EE"), + 76: ("Eswatini", "SZ"), + 77: ("Ethiopia", "ET"), + 78: ("Europe", "150"), + 79: ("European Union", "EU"), + 80: ("Falkland Islands", "FK"), + 81: ("Faroe Islands", "FO"), + 82: ("Fiji", "FJ"), + 83: ("Finland", "FI"), + 84: ("France", "FR"), + 85: ("French Guiana", "GF"), + 86: ("French Polynesia", "PF"), + 87: ("French Southern Territories", "TF"), + 88: ("Gabon", "GA"), + 89: ("Gambia", "GM"), + 90: ("Georgia", "GE"), + 91: ("Germany", "DE"), + 92: ("Ghana", "GH"), + 93: ("Gibraltar", "GI"), + 94: ("Greece", "GR"), + 95: ("Greenland", "GL"), + 96: ("Grenada", "GD"), + 97: ("Guadeloupe", "GP"), + 98: ("Guam", "GU"), + 99: ("Guatemala", "GT"), + 100: ("Guernsey", "GG"), + 101: ("Guinea Bissau", "GW"), + 102: ("Guinea", "GN"), + 103: ("Guyana", "GY"), + 104: ("Haiti", "HT"), + 105: ("Heard And McDonald Islands", "HM"), + 106: ("Honduras", "HN"), + 107: ("Hong Kong", "HK"), + 108: ("Hungary", "HU"), + 109: ("Iceland", "IS"), + 110: ("India", "IN"), + 111: ("Indonesia", "ID"), + 112: ("Iran", "IR"), + 113: ("Iraq", "IQ"), + 114: ("Ireland", "IE"), + 115: ("Isle Of Man", "IM"), + 116: ("Israel", "IL"), + 117: ("Italy", "IT"), # Officially Côte d’Ivoire, which we'd need to map to CotedIvoire # or CoteDIvoire, either failing to make the d' separate from # Cote or messing with its case. 
So stick with Ivory Coast: - 53: ["Ivory Coast", "CI"], - 54: ["Croatia", "HR"], - 55: ["Cuba", "CU"], - 56: ["Cyprus", "CY"], - 57: ["Czechia", "CZ"], - 58: ["Denmark", "DK"], - 59: ["Djibouti", "DJ"], - 60: ["Dominica", "DM"], - 61: ["Dominican Republic", "DO"], - 62: ["Timor-Leste", "TL"], - 63: ["Ecuador", "EC"], - 64: ["Egypt", "EG"], - 65: ["El Salvador", "SV"], - 66: ["Equatorial Guinea", "GQ"], - 67: ["Eritrea", "ER"], - 68: ["Estonia", "EE"], - 69: ["Ethiopia", "ET"], - 70: ["Falkland Islands", "FK"], - 71: ["Faroe Islands", "FO"], - 72: ["Fiji", "FJ"], - 73: ["Finland", "FI"], - 74: ["France", "FR"], - 75: ["Guernsey", "GG"], - 76: ["French Guiana", "GF"], - 77: ["French Polynesia", "PF"], - 78: ["French Southern Territories", "TF"], - 79: ["Gabon", "GA"], - 80: ["Gambia", "GM"], - 81: ["Georgia", "GE"], - 82: ["Germany", "DE"], - 83: ["Ghana", "GH"], - 84: ["Gibraltar", "GI"], - 85: ["Greece", "GR"], - 86: ["Greenland", "GL"], - 87: ["Grenada", "GD"], - 88: ["Guadeloupe", "GP"], - 89: ["Guam", "GU"], - 90: ["Guatemala", "GT"], - 91: ["Guinea", "GN"], - 92: ["Guinea Bissau", "GW"], - 93: ["Guyana", "GY"], - 94: ["Haiti", "HT"], - 95: ["Heard And McDonald Islands", "HM"], - 96: ["Honduras", "HN"], - 97: ["Hong Kong", "HK"], - 98: ["Hungary", "HU"], - 99: ["Iceland", "IS"], - 100: ["India", "IN"], - 101: ["Indonesia", "ID"], - 102: ["Iran", "IR"], - 103: ["Iraq", "IQ"], - 104: ["Ireland", "IE"], - 105: ["Israel", "IL"], - 106: ["Italy", "IT"], - 107: ["Jamaica", "JM"], - 108: ["Japan", "JP"], - 109: ["Jordan", "JO"], - 110: ["Kazakhstan", "KZ"], - 111: ["Kenya", "KE"], - 112: ["Kiribati", "KI"], - 113: ["North Korea", "KP"], - 114: ["South Korea", "KR"], - 115: ["Kuwait", "KW"], - 116: ["Kyrgyzstan", "KG"], - 117: ["Laos", "LA"], - 118: ["Latvia", "LV"], - 119: ["Lebanon", "LB"], - 120: ["Lesotho", "LS"], - 121: ["Liberia", "LR"], - 122: ["Libya", "LY"], - 123: ["Liechtenstein", "LI"], - 124: ["Lithuania", "LT"], - 125: ["Luxembourg", "LU"], - 126: 
["Macao", "MO"], - 127: ["Macedonia", "MK"], - 128: ["Madagascar", "MG"], - 129: ["Malawi", "MW"], - 130: ["Malaysia", "MY"], - 131: ["Maldives", "MV"], - 132: ["Mali", "ML"], - 133: ["Malta", "MT"], - 134: ["Marshall Islands", "MH"], - 135: ["Martinique", "MQ"], - 136: ["Mauritania", "MR"], - 137: ["Mauritius", "MU"], - 138: ["Mayotte", "YT"], - 139: ["Mexico", "MX"], - 140: ["Micronesia", "FM"], - 141: ["Moldova", "MD"], - 142: ["Monaco", "MC"], - 143: ["Mongolia", "MN"], - 144: ["Montserrat", "MS"], - 145: ["Morocco", "MA"], - 146: ["Mozambique", "MZ"], - 147: ["Myanmar", "MM"], - 148: ["Namibia", "NA"], - 149: ["Nauru", "NR"], - 150: ["Nepal", "NP"], - 151: ["Netherlands", "NL"], - 152: ["Curacao", "CW"], - 153: ["New Caledonia", "NC"], - 154: ["New Zealand", "NZ"], - 155: ["Nicaragua", "NI"], - 156: ["Niger", "NE"], - 157: ["Nigeria", "NG"], - 158: ["Niue", "NU"], - 159: ["Norfolk Island", "NF"], - 160: ["Northern Mariana Islands", "MP"], - 161: ["Norway", "NO"], - 162: ["Oman", "OM"], - 163: ["Pakistan", "PK"], - 164: ["Palau", "PW"], - 165: ["Palestinian Territories", "PS"], - 166: ["Panama", "PA"], - 167: ["Papua New Guinea", "PG"], - 168: ["Paraguay", "PY"], - 169: ["Peru", "PE"], - 170: ["Philippines", "PH"], - 171: ["Pitcairn", "PN"], - 172: ["Poland", "PL"], - 173: ["Portugal", "PT"], - 174: ["Puerto Rico", "PR"], - 175: ["Qatar", "QA"], - 176: ["Reunion", "RE"], - 177: ["Romania", "RO"], - 178: ["Russia", "RU"], - 179: ["Rwanda", "RW"], - 180: ["Saint Kitts And Nevis", "KN"], - 181: ["Saint Lucia", "LC"], - 182: ["Saint Vincent And Grenadines", "VC"], - 183: ["Samoa", "WS"], - 184: ["San Marino", "SM"], - 185: ["Sao Tome And Principe", "ST"], - 186: ["Saudi Arabia", "SA"], - 187: ["Senegal", "SN"], - 188: ["Seychelles", "SC"], - 189: ["Sierra Leone", "SL"], - 190: ["Singapore", "SG"], - 191: ["Slovakia", "SK"], - 192: ["Slovenia", "SI"], - 193: ["Solomon Islands", "SB"], - 194: ["Somalia", "SO"], - 195: ["South Africa", "ZA"], - 196: ["South Georgia 
And South Sandwich Islands", "GS"], - 197: ["Spain", "ES"], - 198: ["Sri Lanka", "LK"], - 199: ["Saint Helena", "SH"], - 200: ["Saint Pierre And Miquelon", "PM"], - 201: ["Sudan", "SD"], - 202: ["Suriname", "SR"], - 203: ["Svalbard And Jan Mayen", "SJ"], - 204: ["Eswatini", "SZ"], - 205: ["Sweden", "SE"], - 206: ["Switzerland", "CH"], - 207: ["Syria", "SY"], - 208: ["Taiwan", "TW"], - 209: ["Tajikistan", "TJ"], - 210: ["Tanzania", "TZ"], - 211: ["Thailand", "TH"], - 212: ["Togo", "TG"], - 213: ["Tokelau", "TK"], - 214: ["Tonga", "TO"], - 215: ["Trinidad And Tobago", "TT"], - 216: ["Tunisia", "TN"], - 217: ["Turkey", "TR"], - 218: ["Turkmenistan", "TM"], - 219: ["Turks And Caicos Islands", "TC"], - 220: ["Tuvalu", "TV"], - 221: ["Uganda", "UG"], - 222: ["Ukraine", "UA"], - 223: ["United Arab Emirates", "AE"], - 224: ["United Kingdom", "GB"], - 225: ["United States", "US"], - 226: ["United States Outlying Islands", "UM"], - 227: ["Uruguay", "UY"], - 228: ["Uzbekistan", "UZ"], - 229: ["Vanuatu", "VU"], - 230: ["Vatican City", "VA"], - 231: ["Venezuela", "VE"], - 232: ["Vietnam", "VN"], - 233: ["British Virgin Islands", "VG"], - 234: ["United States Virgin Islands", "VI"], - 235: ["Wallis And Futuna", "WF"], - 236: ["Western Sahara", "EH"], - 237: ["Yemen", "YE"], - 238: ["Canary Islands", "IC"], - 239: ["Zambia", "ZM"], - 240: ["Zimbabwe", "ZW"], - 241: ["Clipperton Island", "CP"], - 242: ["Montenegro", "ME"], - 243: ["Serbia", "RS"], - 244: ["Saint Barthelemy", "BL"], - 245: ["Saint Martin", "MF"], - 246: ["Latin America", "419"], - 247: ["Ascension Island", "AC"], - 248: ["Aland Islands", "AX"], - 249: ["Diego Garcia", "DG"], - 250: ["Ceuta And Melilla", "EA"], - 251: ["Isle Of Man", "IM"], - 252: ["Jersey", "JE"], - 253: ["Tristan Da Cunha", "TA"], - 254: ["South Sudan", "SS"], - 255: ["Caribbean Netherlands", "BQ"], - 256: ["Sint Maarten", "SX"], - 257: ["Kosovo", "XK"], - 258: ["European Union", "EU"], - 259: ["Outlying Oceania", "QO"], - 260: ["World", "001"], - 
261: ["Europe", "150"], + 118: ("Ivory Coast", "CI"), + 119: ("Jamaica", "JM"), + 120: ("Japan", "JP"), + 121: ("Jersey", "JE"), + 122: ("Jordan", "JO"), + 123: ("Kazakhstan", "KZ"), + 124: ("Kenya", "KE"), + 125: ("Kiribati", "KI"), + 126: ("Kosovo", "XK"), + 127: ("Kuwait", "KW"), + 128: ("Kyrgyzstan", "KG"), + 129: ("Laos", "LA"), + 130: ("Latin America", "419"), + 131: ("Latvia", "LV"), + 132: ("Lebanon", "LB"), + 133: ("Lesotho", "LS"), + 134: ("Liberia", "LR"), + 135: ("Libya", "LY"), + 136: ("Liechtenstein", "LI"), + 137: ("Lithuania", "LT"), + 138: ("Luxembourg", "LU"), + 139: ("Macao", "MO"), + 140: ("Macedonia", "MK"), + 141: ("Madagascar", "MG"), + 142: ("Malawi", "MW"), + 143: ("Malaysia", "MY"), + 144: ("Maldives", "MV"), + 145: ("Mali", "ML"), + 146: ("Malta", "MT"), + 147: ("Marshall Islands", "MH"), + 148: ("Martinique", "MQ"), + 149: ("Mauritania", "MR"), + 150: ("Mauritius", "MU"), + 151: ("Mayotte", "YT"), + 152: ("Mexico", "MX"), + 153: ("Micronesia", "FM"), + 154: ("Moldova", "MD"), + 155: ("Monaco", "MC"), + 156: ("Mongolia", "MN"), + 157: ("Montenegro", "ME"), + 158: ("Montserrat", "MS"), + 159: ("Morocco", "MA"), + 160: ("Mozambique", "MZ"), + 161: ("Myanmar", "MM"), + 162: ("Namibia", "NA"), + 163: ("Nauru", "NR"), + 164: ("Nepal", "NP"), + 165: ("Netherlands", "NL"), + 166: ("New Caledonia", "NC"), + 167: ("New Zealand", "NZ"), + 168: ("Nicaragua", "NI"), + 169: ("Nigeria", "NG"), + 170: ("Niger", "NE"), + 171: ("Niue", "NU"), + 172: ("Norfolk Island", "NF"), + 173: ("Northern Mariana Islands", "MP"), + 174: ("North Korea", "KP"), + 175: ("Norway", "NO"), + 176: ("Oman", "OM"), + 177: ("Outlying Oceania", "QO"), + 178: ("Pakistan", "PK"), + 179: ("Palau", "PW"), + 180: ("Palestinian Territories", "PS"), + 181: ("Panama", "PA"), + 182: ("Papua New Guinea", "PG"), + 183: ("Paraguay", "PY"), + 184: ("Peru", "PE"), + 185: ("Philippines", "PH"), + 186: ("Pitcairn", "PN"), + 187: ("Poland", "PL"), + 188: ("Portugal", "PT"), + 189: ("Puerto 
Rico", "PR"), + 190: ("Qatar", "QA"), + 191: ("Reunion", "RE"), + 192: ("Romania", "RO"), + 193: ("Russia", "RU"), + 194: ("Rwanda", "RW"), + 195: ("Saint Barthelemy", "BL"), + 196: ("Saint Helena", "SH"), + 197: ("Saint Kitts And Nevis", "KN"), + 198: ("Saint Lucia", "LC"), + 199: ("Saint Martin", "MF"), + 200: ("Saint Pierre And Miquelon", "PM"), + 201: ("Saint Vincent And Grenadines", "VC"), + 202: ("Samoa", "WS"), + 203: ("San Marino", "SM"), + 204: ("Sao Tome And Principe", "ST"), + 205: ("Saudi Arabia", "SA"), + 206: ("Senegal", "SN"), + 207: ("Serbia", "RS"), + 208: ("Seychelles", "SC"), + 209: ("Sierra Leone", "SL"), + 210: ("Singapore", "SG"), + 211: ("Sint Maarten", "SX"), + 212: ("Slovakia", "SK"), + 213: ("Slovenia", "SI"), + 214: ("Solomon Islands", "SB"), + 215: ("Somalia", "SO"), + 216: ("South Africa", "ZA"), + 217: ("South Georgia And South Sandwich Islands", "GS"), + 218: ("South Korea", "KR"), + 219: ("South Sudan", "SS"), + 220: ("Spain", "ES"), + 221: ("Sri Lanka", "LK"), + 222: ("Sudan", "SD"), + 223: ("Suriname", "SR"), + 224: ("Svalbard And Jan Mayen", "SJ"), + 225: ("Sweden", "SE"), + 226: ("Switzerland", "CH"), + 227: ("Syria", "SY"), + 228: ("Taiwan", "TW"), + 229: ("Tajikistan", "TJ"), + 230: ("Tanzania", "TZ"), + 231: ("Thailand", "TH"), + 232: ("Timor-Leste", "TL"), + 233: ("Togo", "TG"), + 234: ("Tokelau", "TK"), + 235: ("Tonga", "TO"), + 236: ("Trinidad And Tobago", "TT"), + 237: ("Tristan Da Cunha", "TA"), + 238: ("Tunisia", "TN"), + 239: ("Turkey", "TR"), + 240: ("Turkmenistan", "TM"), + 241: ("Turks And Caicos Islands", "TC"), + 242: ("Tuvalu", "TV"), + 243: ("Uganda", "UG"), + 244: ("Ukraine", "UA"), + 245: ("United Arab Emirates", "AE"), + 246: ("United Kingdom", "GB"), + 247: ("United States Outlying Islands", "UM"), + 248: ("United States", "US"), + 249: ("United States Virgin Islands", "VI"), + 250: ("Uruguay", "UY"), + 251: ("Uzbekistan", "UZ"), + 252: ("Vanuatu", "VU"), + 253: ("Vatican City", "VA"), + 254: ("Venezuela", 
"VE"), + 255: ("Vietnam", "VN"), + 256: ("Wallis And Futuna", "WF"), + 257: ("Western Sahara", "EH"), + 258: ("World", "001"), + 259: ("Yemen", "YE"), + 260: ("Zambia", "ZM"), + 261: ("Zimbabwe", "ZW"), } country_aliases = { @@ -692,148 +698,149 @@ country_aliases = { } script_list = { - 0: ["AnyScript", "Zzzz"], - 1: ["Arabic", "Arab"], - 2: ["Cyrillic", "Cyrl"], - 3: ["Deseret", "Dsrt"], - 4: ["Gurmukhi", "Guru"], - 5: ["Simplified Han", "Hans"], - 6: ["Traditional Han", "Hant"], - 7: ["Latin", "Latn"], - 8: ["Mongolian", "Mong"], - 9: ["Tifinagh", "Tfng"], - 10: ["Armenian", "Armn"], - 11: ["Bangla", "Beng"], - 12: ["Cherokee", "Cher"], - 13: ["Devanagari", "Deva"], - 14: ["Ethiopic", "Ethi"], - 15: ["Georgian", "Geor"], - 16: ["Greek", "Grek"], - 17: ["Gujarati", "Gujr"], - 18: ["Hebrew", "Hebr"], - 19: ["Japanese", "Jpan"], - 20: ["Khmer", "Khmr"], - 21: ["Kannada", "Knda"], - 22: ["Korean", "Kore"], - 23: ["Lao", "Laoo"], - 24: ["Malayalam", "Mlym"], - 25: ["Myanmar", "Mymr"], - 26: ["Odia", "Orya"], - 27: ["Tamil", "Taml"], - 28: ["Telugu", "Telu"], - 29: ["Thaana", "Thaa"], - 30: ["Thai", "Thai"], - 31: ["Tibetan", "Tibt"], - 32: ["Sinhala", "Sinh"], - 33: ["Syriac", "Syrc"], - 34: ["Yi", "Yiii"], - 35: ["Vai", "Vaii"], - 36: ["Avestan", "Avst"], - 37: ["Balinese", "Bali"], - 38: ["Bamum", "Bamu"], - 39: ["Batak", "Batk"], - 40: ["Bopomofo", "Bopo"], - 41: ["Brahmi", "Brah"], - 42: ["Buginese", "Bugi"], - 43: ["Buhid", "Buhd"], - 44: ["Canadian Aboriginal", "Cans"], - 45: ["Carian", "Cari"], - 46: ["Chakma", "Cakm"], - 47: ["Cham", "Cham"], - 48: ["Coptic", "Copt"], - 49: ["Cypriot", "Cprt"], - 50: ["Egyptian Hieroglyphs", "Egyp"], - 51: ["Fraser", "Lisu"], - 52: ["Glagolitic", "Glag"], - 53: ["Gothic", "Goth"], - 54: ["Han", "Hani"], - 55: ["Hangul", "Hang"], - 56: ["Hanunoo", "Hano"], - 57: ["Imperial Aramaic", "Armi"], - 58: ["Inscriptional Pahlavi", "Phli"], - 59: ["Inscriptional Parthian", "Prti"], - 60: ["Javanese", "Java"], - 61: ["Kaithi", "Kthi"], 
- 62: ["Katakana", "Kana"], - 63: ["Kayah Li", "Kali"], - 64: ["Kharoshthi", "Khar"], - 65: ["Lanna", "Lana"], - 66: ["Lepcha", "Lepc"], - 67: ["Limbu", "Limb"], - 68: ["Linear B", "Linb"], - 69: ["Lycian", "Lyci"], - 70: ["Lydian", "Lydi"], - 71: ["Mandaean", "Mand"], - 72: ["Meitei Mayek", "Mtei"], - 73: ["Meroitic", "Mero"], - 74: ["Meroitic Cursive", "Merc"], - 75: ["Nko", "Nkoo"], - 76: ["New Tai Lue", "Talu"], - 77: ["Ogham", "Ogam"], - 78: ["Ol Chiki", "Olck"], - 79: ["Old Italic", "Ital"], - 80: ["Old Persian", "Xpeo"], - 81: ["Old South Arabian", "Sarb"], - 82: ["Orkhon", "Orkh"], - 83: ["Osmanya", "Osma"], - 84: ["Phags Pa", "Phag"], - 85: ["Phoenician", "Phnx"], - 86: ["Pollard Phonetic", "Plrd"], - 87: ["Rejang", "Rjng"], - 88: ["Runic", "Runr"], - 89: ["Samaritan", "Samr"], - 90: ["Saurashtra", "Saur"], - 91: ["Sharada", "Shrd"], - 92: ["Shavian", "Shaw"], - 93: ["Sora Sompeng", "Sora"], - 94: ["Cuneiform", "Xsux"], - 95: ["Sundanese", "Sund"], - 96: ["Syloti Nagri", "Sylo"], - 97: ["Tagalog", "Tglg"], - 98: ["Tagbanwa", "Tagb"], - 99: ["Tai Le", "Tale"], - 100: ["Tai Viet", "Tavt"], - 101: ["Takri", "Takr"], - 102: ["Ugaritic", "Ugar"], - 103: ["Braille", "Brai"], - 104: ["Hiragana", "Hira"], - 105: ["Caucasian Albanian", "Aghb"], - 106: ["Bassa Vah", "Bass"], - 107: ["Duployan", "Dupl"], - 108: ["Elbasan", "Elba"], - 109: ["Grantha", "Gran"], - 110: ["Pahawh Hmong", "Hmng"], - 111: ["Khojki", "Khoj"], - 112: ["Linear A", "Lina"], - 113: ["Mahajani", "Mahj"], - 114: ["Manichaean", "Mani"], - 115: ["Mende", "Mend"], - 116: ["Modi", "Modi"], - 117: ["Mro", "Mroo"], - 118: ["Old North Arabian", "Narb"], - 119: ["Nabataean", "Nbat"], - 120: ["Palmyrene", "Palm"], - 121: ["Pau Cin Hau", "Pauc"], - 122: ["Old Permic", "Perm"], - 123: ["Psalter Pahlavi", "Phlp"], - 124: ["Siddham", "Sidd"], - 125: ["Khudawadi", "Sind"], - 126: ["Tirhuta", "Tirh"], - 127: ["Varang Kshiti", "Wara"], - 128: ["Ahom", "Ahom"], - 129: ["Anatolian Hieroglyphs", "Hluw"], - 130: 
["Hatran", "Hatr"], - 131: ["Multani", "Mult"], - 132: ["Old Hungarian", "Hung"], - 133: ["Sign Writing", "Sgnw"], - 134: ["Adlam", "Adlm"], - 135: ["Bhaiksuki", "Bhks"], - 136: ["Marchen", "Marc"], - 137: ["Newa", "Newa"], - 138: ["Osage", "Osge"], - 139: ["Tangut", "Tang"], - 140: ["Han with Bopomofo", "Hanb"], - 141: ["Jamo", "Jamo"], + 0: ("AnyScript", "Zzzz"), + + 1: ("Adlam", "Adlm"), + 2: ("Ahom", "Ahom"), + 3: ("Anatolian Hieroglyphs", "Hluw"), + 4: ("Arabic", "Arab"), + 5: ("Armenian", "Armn"), + 6: ("Avestan", "Avst"), + 7: ("Balinese", "Bali"), + 8: ("Bamum", "Bamu"), + 9: ("Bangla", "Beng"), + 10: ("Bassa Vah", "Bass"), + 11: ("Batak", "Batk"), + 12: ("Bhaiksuki", "Bhks"), + 13: ("Bopomofo", "Bopo"), + 14: ("Brahmi", "Brah"), + 15: ("Braille", "Brai"), + 16: ("Buginese", "Bugi"), + 17: ("Buhid", "Buhd"), + 18: ("Canadian Aboriginal", "Cans"), + 19: ("Carian", "Cari"), + 20: ("Caucasian Albanian", "Aghb"), + 21: ("Chakma", "Cakm"), + 22: ("Cham", "Cham"), + 23: ("Cherokee", "Cher"), + 24: ("Coptic", "Copt"), + 25: ("Cuneiform", "Xsux"), + 26: ("Cypriot", "Cprt"), + 27: ("Cyrillic", "Cyrl"), + 28: ("Deseret", "Dsrt"), + 29: ("Devanagari", "Deva"), + 30: ("Duployan", "Dupl"), + 31: ("Egyptian Hieroglyphs", "Egyp"), + 32: ("Elbasan", "Elba"), + 33: ("Ethiopic", "Ethi"), + 34: ("Fraser", "Lisu"), + 35: ("Georgian", "Geor"), + 36: ("Glagolitic", "Glag"), + 37: ("Gothic", "Goth"), + 38: ("Grantha", "Gran"), + 39: ("Greek", "Grek"), + 40: ("Gujarati", "Gujr"), + 41: ("Gurmukhi", "Guru"), + 42: ("Hangul", "Hang"), + 43: ("Han", "Hani"), + 44: ("Hanunoo", "Hano"), + 45: ("Han with Bopomofo", "Hanb"), + 46: ("Hatran", "Hatr"), + 47: ("Hebrew", "Hebr"), + 48: ("Hiragana", "Hira"), + 49: ("Imperial Aramaic", "Armi"), + 50: ("Inscriptional Pahlavi", "Phli"), + 51: ("Inscriptional Parthian", "Prti"), + 52: ("Jamo", "Jamo"), + 53: ("Japanese", "Jpan"), + 54: ("Javanese", "Java"), + 55: ("Kaithi", "Kthi"), + 56: ("Kannada", "Knda"), + 57: ("Katakana", "Kana"), + 58: 
("Kayah Li", "Kali"), + 59: ("Kharoshthi", "Khar"), + 60: ("Khmer", "Khmr"), + 61: ("Khojki", "Khoj"), + 62: ("Khudawadi", "Sind"), + 63: ("Korean", "Kore"), + 64: ("Lanna", "Lana"), + 65: ("Lao", "Laoo"), + 66: ("Latin", "Latn"), + 67: ("Lepcha", "Lepc"), + 68: ("Limbu", "Limb"), + 69: ("Linear A", "Lina"), + 70: ("Linear B", "Linb"), + 71: ("Lycian", "Lyci"), + 72: ("Lydian", "Lydi"), + 73: ("Mahajani", "Mahj"), + 74: ("Malayalam", "Mlym"), + 75: ("Mandaean", "Mand"), + 76: ("Manichaean", "Mani"), + 77: ("Marchen", "Marc"), + 78: ("Meitei Mayek", "Mtei"), + 79: ("Mende", "Mend"), + 80: ("Meroitic Cursive", "Merc"), + 81: ("Meroitic", "Mero"), + 82: ("Modi", "Modi"), + 83: ("Mongolian", "Mong"), + 84: ("Mro", "Mroo"), + 85: ("Multani", "Mult"), + 86: ("Myanmar", "Mymr"), + 87: ("Nabataean", "Nbat"), + 88: ("Newa", "Newa"), + 89: ("New Tai Lue", "Talu"), + 90: ("Nko", "Nkoo"), + 91: ("Odia", "Orya"), + 92: ("Ogham", "Ogam"), + 93: ("Ol Chiki", "Olck"), + 94: ("Old Hungarian", "Hung"), + 95: ("Old Italic", "Ital"), + 96: ("Old North Arabian", "Narb"), + 97: ("Old Permic", "Perm"), + 98: ("Old Persian", "Xpeo"), + 99: ("Old South Arabian", "Sarb"), + 100: ("Orkhon", "Orkh"), + 101: ("Osage", "Osge"), + 102: ("Osmanya", "Osma"), + 103: ("Pahawh Hmong", "Hmng"), + 104: ("Palmyrene", "Palm"), + 105: ("Pau Cin Hau", "Pauc"), + 106: ("Phags Pa", "Phag"), + 107: ("Phoenician", "Phnx"), + 108: ("Pollard Phonetic", "Plrd"), + 109: ("Psalter Pahlavi", "Phlp"), + 110: ("Rejang", "Rjng"), + 111: ("Runic", "Runr"), + 112: ("Samaritan", "Samr"), + 113: ("Saurashtra", "Saur"), + 114: ("Sharada", "Shrd"), + 115: ("Shavian", "Shaw"), + 116: ("Siddham", "Sidd"), + 117: ("Sign Writing", "Sgnw"), + 118: ("Simplified Han", "Hans"), + 119: ("Sinhala", "Sinh"), + 120: ("Sora Sompeng", "Sora"), + 121: ("Sundanese", "Sund"), + 122: ("Syloti Nagri", "Sylo"), + 123: ("Syriac", "Syrc"), + 124: ("Tagalog", "Tglg"), + 125: ("Tagbanwa", "Tagb"), + 126: ("Tai Le", "Tale"), + 127: ("Tai Viet", 
"Tavt"), + 128: ("Takri", "Takr"), + 129: ("Tamil", "Taml"), + 130: ("Tangut", "Tang"), + 131: ("Telugu", "Telu"), + 132: ("Thaana", "Thaa"), + 133: ("Thai", "Thai"), + 134: ("Tibetan", "Tibt"), + 135: ("Tifinagh", "Tfng"), + 136: ("Tirhuta", "Tirh"), + 137: ("Traditional Han", "Hant"), + 138: ("Ugaritic", "Ugar"), + 139: ("Vai", "Vaii"), + 140: ("Varang Kshiti", "Wara"), + 141: ("Yi", "Yiii"), } script_aliases = { |