2020-04-03 08:30:08 +02:00
|
|
|
#
|
|
|
|
# parse-unidata.awk - generate a table (unicode_case_mapping_upper)
|
|
|
|
#
|
|
|
|
# Copyright (C) 2020 g10 Code GmbH
|
|
|
|
#
|
|
|
|
# This file is part of GnuPG.
|
|
|
|
#
|
|
|
|
# GnuPG is free software; you can redistribute it and/or modify
|
|
|
|
# it under the terms of the GNU General Public License as published by
|
|
|
|
# the Free Software Foundation; either version 3 of the License, or
|
|
|
|
# (at your option) any later version.
|
|
|
|
#
|
|
|
|
# GnuPG is distributed in the hope that it will be useful,
|
|
|
|
# but WITHOUT ANY WARRANTY; without even the implied warranty of
|
|
|
|
# MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the
|
|
|
|
# GNU General Public License for more details.
|
|
|
|
#
|
|
|
|
# You should have received a copy of the GNU General Public License
|
|
|
|
# along with this program; if not, see <https://www.gnu.org/licenses/>.
|
|
|
|
#
|
|
|
|
|
|
|
|
# Parse the unicode data from:
|
|
|
|
# https://www.unicode.org/Public/UCD/latest/ucd/UnicodeData.txt
|
|
|
|
# to generate case mapping table
|
|
|
|
|
|
|
|
BEGIN {
|
|
|
|
print("/* Generated from UnicodeData.txt */")
|
|
|
|
print("")
|
|
|
|
print("static const struct casemap unicode_case_mapping_upper[] = {")
|
|
|
|
FS = ";"
|
|
|
|
count = 0
|
|
|
|
}
|
|
|
|
|
|
|
|
{
|
2020-04-15 07:10:08 +02:00
|
|
|
code = int("0x" $1)
|
2020-04-03 08:30:08 +02:00
|
|
|
name = $2
|
|
|
|
class = $3
|
|
|
|
upper = $13
|
|
|
|
lower = $14
|
|
|
|
title = $15
|
|
|
|
|
2020-04-15 07:10:08 +02:00
|
|
|
if (code <= 127) {
|
2020-04-03 08:30:08 +02:00
|
|
|
next
|
|
|
|
}
|
2020-04-15 07:10:08 +02:00
|
|
|
if (code > 65535) {
|
2020-04-03 08:30:08 +02:00
|
|
|
next
|
|
|
|
}
|
|
|
|
if ($3 !~ /^L.*/) {
|
|
|
|
next
|
|
|
|
}
|
|
|
|
if (upper != "") {
|
|
|
|
printf("\t{ 0x" tolower($1) ", 0x" tolower(upper) " },")
|
|
|
|
count++
|
|
|
|
if ((count % 4) == 0) {
|
|
|
|
print("")
|
|
|
|
}
|
|
|
|
}
|
|
|
|
}
|
|
|
|
|
|
|
|
END {
|
|
|
|
print("\n};")
|
|
|
|
}
|