summaryrefslogtreecommitdiffstats
path: root/util/unicode/update_ucd.sh
blob: 64fee6ddc9263a90c47307b9f5e29dc382367099 (plain)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
#! /bin/sh
# Copyright (C) 2021 The Qt Company Ltd.
# SPDX-License-Identifier: LicenseRef-Qt-Commercial OR GPL-3.0-only WITH Qt-GPL-exception-1.0

# This script downloads UCD files for an Unicode release and updates the
# copies used by Qt. It expects the new Unicode version as argument:
#
#      $ ./update_ucd.sh 14.0.0

set -e

if [ "$#" -ne 1 ]
then
    echo "Usage: $0 <UNICODE-VERSION>" >&2
    exit 1
fi

VERSION="$1"

qtbase=$(realpath "$(dirname "$0")"/../..)
tmp=$(mktemp)

download()
{
    wget -nv -P "$tmp" "$1"
}

download "https://www.unicode.org/Public/zipped/$VERSION/UCD.zip"
unzip -q "$tmp/UCD.zip" -d "$tmp"
download "https://www.unicode.org/Public/idna/$VERSION/IdnaMappingTable.txt"
download "https://www.unicode.org/Public/idna/$VERSION/IdnaTestV2.txt"

data_dirs="util/unicode/data \
tests/auto/corelib/io/qurluts46/testdata \
tests/auto/corelib/text/qtextboundaryfinder/data"

for dir in $data_dirs
do
    find "$qtbase/$dir" -name '*.txt' -o -name '*.html'
done | grep -vw 'ReadMe.*\.txt' | while read -r file
do
    base_name=$(basename "$file")
    echo "Updating ${base_name}"
    full_name=$(find "$tmp" -name "$base_name" -print -quit)
    if [ "$full_name" = "" ]
    then
        echo "No source file for: ${base_name}" >&2
        exit 1
    fi
    cp "$full_name" "$file"
done

rm -rf "$tmp"