summaryrefslogtreecommitdiffstats
path: root/util/locale_database/enumdata.py
diff options
context:
space:
mode:
authorEdward Welbourne <edward.welbourne@qt.io>2025-11-13 18:20:23 +0100
committerEdward Welbourne <edward.welbourne@qt.io>2025-11-18 15:07:47 +0100
commit676e8f2570ad2208e170743024c25aabe30c81cc (patch)
treebdeaefea77a08b636cc721c1e819e5ea91feb41b /util/locale_database/enumdata.py
parent4bc6aa5f52926fefca87a6154fbeda62dcec177b (diff)
Include new languages for CLDR v48
Include two new languages, Ladin and Shan, and document the various languages and scripts that show up in the cldr2qlocalexml.py output, that I have checked and seen to contain inadequate information. This may make it easier for future updaters to spot new unknown codes when they show up. These are not picked back to past versions because they're naturally documented as [since 6.11] and picking would involve each past branch getting a minor version as its since. Fixes: QTBUG-141949 Change-Id: If0cb3e3b33cd3ce636fd29e904a9ddd617940314 Reviewed-by: Mate Barany <mate.barany@qt.io>
Diffstat (limited to 'util/locale_database/enumdata.py')
-rw-r--r--util/locale_database/enumdata.py42
1 files changed, 42 insertions, 0 deletions
diff --git a/util/locale_database/enumdata.py b/util/locale_database/enumdata.py
index e654fb4d1a9..17aa84c0893 100644
--- a/util/locale_database/enumdata.py
+++ b/util/locale_database/enumdata.py
@@ -411,12 +411,50 @@ language_map = {
# added in CLDR v46
345: ("Kara-Kalpak", "kaa"),
346: ("Swampy Cree", "csw"),
+ # added in CLDR v48
+ 347: ("Ladin", "lld"), # very minority (in Italy)
+ 348: ("Shan", "shn"),
}
# Don't add languages just because they exist; check CLDR does provide
# substantial data for locales using it; and check, once added, they
# don't show up in cldr2qlocalexml.py's unused listing. Do also check
# the data's draft status; if it's (nearly) all unconfirmed, leave it.
+# Known, but omitted because too little that isn't draft="unconfirmed",
+# at least at v48:
+# ("Betawi", "bew"),
+# ("Bakhtiari", "bqi"),
+# ("Buriat", "bua"),
+# ("Caddo", "cad"),
+# ("Choctaw", "cho"),
+# ("Hakka", "hak"), # or Hakka Chinese
+# ("Hassaniyya", "mey"),
+# ("Hmong Njua", "hnj"),
+# ("Qʼeqchiʼ", "kek"),
+# ("Lombard", "lmo"),
+# ("Latgalian", "ltg"),
+# ("Laz", "lzz"),
+# ("Min Nan", "nan"), # or Min Nan Chinese
+# ("Mi'kmaw", "mic"),
+# ("Mócheno", "mhn"),
+# ("Mundari", "unr"),
+# ("Okanagan", "oka"),
+# ("Hmong Daw", "mww"),
+# ("Okanagan", "oka"),
+# ("Piedmontese", "pms"),
+# ("Pontic", "pnt"),
+# ("Riffian", "rif"),
+# ("Samogitian", "sgs"),
+# ("Samtao", "stu"),
+# ("Saraiki", "skr"),
+# ("Sunwar", "suz"),
+# ("Tuvinian", "tyv"), # not far short of adequate
+# ("Makhuwa", "vmw"),
+
+# It can be helpful to look in supplemental/supplementalData.xml for
+# languagePopulation entries for codes not translated in en.xml (the
+# source used by these scripts) to map them to names.
+
language_aliases = {
# Renamings prior to Qt 6.0 (CLDR v37):
'Afan': 'Oromo',
@@ -888,6 +926,10 @@ script_map = {
# Added at CLDR v43
142: ("Hanifi", "Rohg"), # Used for Rohingya
}
+# Omitted for want of data (see similar after language_map):
+# ("Nyiakeng Puachue Hmong", "Hmnp"),
+# ("Sunuwar", "Sunu"),
+
script_aliases = {
# Renamings prior to Qt 6.0 (CLDR v37):