summaryrefslogtreecommitdiffstats
path: root/util/locale_database/cldr2qlocalexml.py
diff options
context:
space:
mode:
Diffstat (limited to 'util/locale_database/cldr2qlocalexml.py')
-rwxr-xr-xutil/locale_database/cldr2qlocalexml.py153
1 files changed, 67 insertions, 86 deletions
diff --git a/util/locale_database/cldr2qlocalexml.py b/util/locale_database/cldr2qlocalexml.py
index 20dda77965..d3aa88ec38 100755
--- a/util/locale_database/cldr2qlocalexml.py
+++ b/util/locale_database/cldr2qlocalexml.py
@@ -1,48 +1,27 @@
-#!/usr/bin/env python2
-# coding=utf8
-#############################################################################
-##
-## Copyright (C) 2020 The Qt Company Ltd.
-## Contact: https://www.qt.io/licensing/
-##
-## This file is part of the test suite of the Qt Toolkit.
-##
-## $QT_BEGIN_LICENSE:GPL-EXCEPT$
-## Commercial License Usage
-## Licensees holding valid commercial Qt licenses may use this file in
-## accordance with the commercial license agreement provided with the
-## Software or, alternatively, in accordance with the terms contained in
-## a written agreement between you and The Qt Company. For licensing terms
-## and conditions see https://www.qt.io/terms-conditions. For further
-## information use the contact form at https://www.qt.io/contact-us.
-##
-## GNU General Public License Usage
-## Alternatively, this file may be used under the terms of the GNU
-## General Public License version 3 as published by the Free Software
-## Foundation with exceptions as appearing in the file LICENSE.GPL3-EXCEPT
-## included in the packaging of this file. Please review the following
-## information to ensure the GNU General Public License requirements will
-## be met: https://www.gnu.org/licenses/gpl-3.0.html.
-##
-## $QT_END_LICENSE$
-##
-#############################################################################
-"""Convert CLDR data to qLocaleXML
-
-The CLDR data can be downloaded from CLDR_, which has a sub-directory
-for each version; you need the ``core.zip`` file for your version of
-choice (typically the latest). This script has had updates to cope up
-to v38.1; for later versions, we may need adaptations. Unpack the
-downloaded ``core.zip`` and check it has a common/main/ sub-directory:
-pass the path of that root of the download to this script as its first
-command-line argument. Pass the name of the file in which to write
-output as the second argument; either omit it or use '-' to select the
-standard output. This file is the input needed by
-``./qlocalexml2cpp.py``
+#!/usr/bin/env python3
+# Copyright (C) 2021 The Qt Company Ltd.
+# SPDX-License-Identifier: LicenseRef-Qt-Commercial OR GPL-3.0-only WITH Qt-GPL-exception-1.0
+"""Convert CLDR data to QLocaleXML
+
+The CLDR data can be downloaded as a zip-file from CLDR_, which has a
+sub-directory for each version; you need the ``core.zip`` file for
+your version of choice (typically the latest), which you should then
+unpack. Alternatively, you can clone the git repo from github_, which
+has a tag for each release and a maint/maint-$ver branch for each
+major version. Either way, the CLDR top-level directory should have a
+subdirectory called common/ which contains (among other things)
+subdirectories main/ and supplemental/.
+
+This script has had updates to cope up to v44.1; for later versions,
+we may need adaptations. Pass the path of the CLDR top-level directory
+to this script as its first command-line argument. Pass the name of
+the file in which to write output as the second argument; either omit
+it or use '-' to select the standard output. This file is the input
+needed by ``./qlocalexml2cpp.py``
When you update the CLDR data, be sure to also update
src/corelib/text/qt_attribution.json's entry for unicode-cldr. Check
-this script's output for unknown language, country or script messages;
+this script's output for unknown language, territory or script messages;
if any can be resolved, use their entry in common/main/en.xml to
append new entries to enumdata.py's lists and update documentation in
src/corelib/text/qlocale.qdoc, adding the new entries in alphabetic
@@ -51,71 +30,73 @@ order.
While updating the locale data, check also for updates to MS-Win's
time zone names; see cldr2qtimezone.py for details.
-.. _CLDR: ftp://unicode.org/Public/cldr/
+All the scripts mentioned support --help to tell you how to use them.
+
+.. _CLDR: https://unicode.org/Public/cldr/
+.. _github: https://github.com/unicode-org/cldr
"""
-import os
-import sys
+from pathlib import Path
+import argparse
from cldr import CldrReader
from qlocalexml import QLocaleXmlWriter
-from enumdata import language_list, script_list, country_list
-
-def usage(name, err, message = ''):
- err.write("""Usage: {} path/to/cldr/common/main [out-file.xml]
-""".format(name)) # TODO: expand command-line, improve help message
- if message:
- err.write('\n' + message + '\n')
-
-def main(args, out, err):
- # TODO: make calendars a command-line option
- calendars = ['gregorian', 'persian', 'islamic'] # 'hebrew'
-
- # TODO: make argument parsing more sophisticated
- name = args.pop(0)
- if not args:
- usage(name, err, 'Where is your CLDR data tree ?')
- return 1
-
- root = args.pop(0)
- if not os.path.exists(os.path.join(root, 'common', 'main', 'root.xml')):
- usage(name, err,
- 'First argument is the root of the CLDR tree: found no common/main/root.xml under '
- + root)
- return 1
-
- xml = args.pop(0) if args else None
+
+
+def main(argv, out, err):
+ """Generate a QLocaleXML file from CLDR data.
+
+ Takes sys.argv, sys.stdout, sys.stderr (or equivalents) as
+ arguments. In argv[1:], it expects the root of the CLDR data
+ directory as first parameter and the name of the file in which to
+ save QLocaleXML data as second parameter. It accepts a --calendars
+ option to select which calendars to support (all available by
+ default)."""
+ all_calendars = ['gregorian', 'persian', 'islamic']
+
+ parser = argparse.ArgumentParser(
+ prog=Path(argv[0]).name,
+ description='Generate QLocaleXML from CLDR data.',
+ formatter_class=argparse.ArgumentDefaultsHelpFormatter)
+ parser.add_argument('cldr_path', help='path to the root of the CLDR tree')
+ parser.add_argument('out_file', help='output XML file name',
+ nargs='?', metavar='out-file.xml')
+ parser.add_argument('--calendars', help='select calendars to emit data for',
+ nargs='+', metavar='CALENDAR',
+ choices=all_calendars, default=all_calendars)
+
+ args = parser.parse_args(argv[1:])
+
+ root = Path(args.cldr_path)
+ root_xml_path = 'common/main/root.xml'
+
+ if not root.joinpath(root_xml_path).exists():
+ parser.error('First argument is the root of the CLDR tree: '
+ f'found no {root_xml_path} under {root}')
+
+ xml = args.out_file
if not xml or xml == '-':
emit = out
elif not xml.endswith('.xml'):
- usage(name, err, 'Please use a .xml extension on your output file name, not ' + xml)
- return 1
+ parser.error(f'Please use a .xml extension on your output file name, not {xml}')
else:
try:
emit = open(xml, 'w')
except IOError as e:
- usage(name, err, 'Failed to open "{}" to write output to it\n'.format(xml))
- return 1
-
- if args:
- usage(name, err, 'Too many arguments - excess: ' + ' '.join(args))
- return 1
-
- if emit.encoding != 'UTF-8' or (emit.encoding is None and sys.getdefaultencoding() != 'UTF-8'):
- reload(sys) # Weirdly, this gets a richer sys module than the plain import got us !
- sys.setdefaultencoding('UTF-8')
+ parser.error(f'Failed to open "{xml}" to write output to it')
# TODO - command line options to tune choice of grumble and whitter:
reader = CldrReader(root, err.write, err.write)
writer = QLocaleXmlWriter(emit.write)
writer.version(reader.root.cldrVersion)
- writer.enumData(language_list, script_list, country_list)
+ writer.enumData(reader.root.englishNaming)
writer.likelySubTags(reader.likelySubTags())
- writer.locales(reader.readLocales(calendars), calendars)
+ writer.locales(reader.readLocales(args.calendars), args.calendars)
- writer.close()
+ writer.close(err.write)
return 0
if __name__ == '__main__':
+ import sys
sys.exit(main(sys.argv, sys.stdout, sys.stderr))