aboutsummaryrefslogtreecommitdiff
path: root/gen
diff options
context:
space:
mode:
authorThomas Voss <mail@thomasvoss.com> 2024-04-18 11:44:31 +0200
committerThomas Voss <mail@thomasvoss.com> 2024-04-18 11:44:31 +0200
commit1616feb4901579da80452c95c6e0f732b945c7d5 (patch)
treea351d926c12adccb32e2913ea4a3a44422d6eea5 /gen
parent5d2bbdfe3191049bbd4bb237a31f34fdf62f347c (diff)
Add uprop_get_jg()
Diffstat (limited to 'gen')
-rwxr-xr-xgen/data-files1
-rwxr-xr-xgen/prop/jg52
2 files changed, 53 insertions, 0 deletions
diff --git a/gen/data-files b/gen/data-files
index 9222c10..9da5452 100755
--- a/gen/data-files
+++ b/gen/data-files
@@ -21,6 +21,7 @@ readonly PATHS='
extracted/DerivedBinaryProperties
extracted/DerivedDecompositionType
extracted/DerivedEastAsianWidth
+ extracted/DerivedJoiningGroup
extracted/DerivedJoiningType
extracted/DerivedLineBreak
extracted/DerivedNumericType
diff --git a/gen/prop/jg b/gen/prop/jg
new file mode 100755
index 0000000..e88442d
--- /dev/null
+++ b/gen/prop/jg
@@ -0,0 +1,52 @@
+#!/bin/sh
+
+set -e
+cd "${0%/*}/../.."
+exec >lib/unicode/prop/uprop_get_jg.c
+
+gawk '
+BEGIN {
+ FS = "[ ;]+"
+
+ print "/* This file is autogenerated by gen/prop/jg; DO NOT EDIT. */"
+ print ""
+ print "#include \"_bsearch.h\""
+ print "#include \"rune.h\""
+ print "#include \"unicode/prop.h\""
+ print ""
+}
+
+/^[A-F0-9]/ {
+ n = split($1, a, /\.\./)
+ lo = strtonum("0X" a[1])
+ hi = strtonum("0X" a[n])
+
+ for (i = lo; i <= hi; i++)
+ props[i] = "JG_" toupper($2)
+}
+
+END {
+ print "static const struct {"
+ print "\trune lo, hi;"
+ print "\tenum uprop_jg val;"
+ print "} lookup[] = {"
+
+ for (i = 0; i <= 0x10FFFF; i++) {
+ if (!props[i])
+ continue
+ for (lo = i; props[lo] == props[i + 1]; i++)
+ ;
+ printf "\t{RUNE_C(0x%06X), RUNE_C(0x%06X), %s},\n", lo, i, props[i]
+ }
+
+ print "};"
+ print ""
+ print "_MLIB_DEFINE_BSEARCH(enum uprop_jg, lookup, JG_NO_JOINING_GROUP)"
+ print ""
+ print "enum uprop_jg"
+ print "uprop_get_jg(rune ch)"
+ print "{"
+ print "\treturn ch < lookup[0].lo ? JG_NO_JOINING_GROUP : mlib_lookup(ch);"
+ print "}"
+}
+' data/DerivedJoiningGroup | sed 's/\s*$//'