Fix script for characters in 3300..3357 range

* admin/unidata/blocks.awk: The characters in the 3300..3357 range
are Katakana according to Unicode's Scripts.txt.
This commit is contained in:
Eli Zaretskii 2024-08-17 11:01:12 +03:00
parent 661e5dec57
commit c70ac0fef1

View file

@@ -146,6 +146,19 @@ FILENAME ~ "Blocks.txt" && /^[0-9A-F]/ {
end[i] = fix_end[e] ? fix_end[e]: e
name[i] = $0
# Hard-coded splits that must be processed before name2alias and
# before combining same-named adjacent ranges.
if (start[i] == "3300") # See Scripts.txt
{
end[i] = "3357"
name[i] = "Katakana"
alt[i] = "kana"
i++
start[i] = "3358"
end[i] = "33FF"
name[i] = "CJK Compatibility"
}
alt[i] = name2alias(name[i])
if (!alt[i])