aboutsummaryrefslogtreecommitdiff
path: root/vendor/librune/gen/rtype-jt
blob: 81185ec6a2e9962bea00478e23426e05c922926d (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
#!/bin/sh

# cache URL
#
# Download URL into /tmp/librune/rtype/, named after the last path component
# of the URL, unless a file of that name already exists there.  Returns
# non-zero if the download fails.
cache()
{
	name="/tmp/librune/rtype/$(basename "$1")"
	if test ! -f "$name"
	then
		mkdir -p /tmp/librune/rtype
		# wget -O creates its output file even when the transfer fails.
		# Fetch into a scratch file and rename it only on success, so a
		# failed or interrupted download never leaves a truncated file
		# that later runs would accept as a valid cache entry.
		tmp="$name.$$"
		if ! wget -q "$1" -O "$tmp"
		then
			rm -f "$tmp"
			return 1
		fi
		mv "$tmp" "$name"
	fi
}

# Abort on the first failing command.
set -e

# Run from the parent of the directory holding this script.  dirname is used
# rather than "${0%/*}" because the latter leaves $0 unchanged when it contains
# no slash, which would make the cd fail.
cd "$(dirname "$0")/.."

# Fetch the input data before redirecting stdout: the redirection truncates
# the generated header, so doing it first would destroy the existing header
# whenever the download fails.
readonly URL='https://www.unicode.org/Public/UCD/latest/ucd/extracted/DerivedJoiningType.txt'
cache "$URL"

# Everything written to stdout from here on goes into the generated header.
exec >include/internal/rtype/jt.h

# Emit the header prologue and open the Latin-1 table.  The heredoc delimiter
# is quoted so the C text is copied verbatim without shell expansion.
cat <<'C'
/* This file is autogenerated by gen/rtype-jt; DO NOT EDIT. */

#ifndef RUNE_INTERNAL_RTYPE_JT_H
#define RUNE_INTERNAL_RTYPE_JT_H

/* IWYU pragma: private */
/* clang-format off */

#include "../types.h"
#include "../../rtype.h"
#include "../../rune.h"

static const rprop_jt_bf rtype_jt_lat1_tbl[] = {
C

# Emit one JT_* initializer for each code point in U+0000..U+00FF, eight per
# tab-indented line.  The formatting is done inside gawk instead of piping
# through paste and sed: a pipeline reports only the status of its last
# command, so a gawk failure would otherwise go unnoticed by "set -e".
gawk '
BEGIN {
	# Fields are separated by " ; "; a trailing "# ..." comment also
	# counts as a separator, so it never ends up inside a field.
	FS = "( *#.*| +; +)"
}

# $1 is a hexadecimal code point or a "lo..hi" range, $2 the property value.
# The match is anchored so only an exact single-letter value is accepted.
$2 ~ /^[UCDRLT]$/ {
	n = split($1, a, /\.\./)
	lo = strtonum("0X" a[1])
	hi = strtonum("0X" a[n])

	# Only the first 256 code points are emitted below, so there is no
	# need to expand ranges past U+00FF.
	if (hi > 0xFF)
		hi = 0xFF
	for (i = lo; i <= hi; i++)
		props[i] = $2
}

END {
	for (i = 0; i <= 0xFF; i++) {
		# Code points without a recorded value default to U.
		printf("%sJT_%s,", (i % 8 ? " " : "\t"), ((i in props) ? props[i] : "U"))
		if (i % 8 == 7)
			printf("\n")
	}
}
' /tmp/librune/rtype/DerivedJoiningType.txt

# Close the previous table and open the range table.  The heredoc delimiter
# is quoted so the C text is copied verbatim without shell expansion.
cat <<'C'
};

static const struct {
	rune lo, hi;
	rprop_jt_bf val;
} rtype_jt_tbl[] = {
C

# Emit one {lo, hi, value} initializer per maximal run of consecutive code
# points that share the same value.  The loop walks code points in ascending
# order, so the output is already sorted; no trailing "sort" is used because
# it would hide a gawk failure from "set -e" (a pipeline reports only the
# status of its last command).
gawk '
BEGIN {
	# Fields are separated by " ; "; a trailing "# ..." comment also
	# counts as a separator, so it never ends up inside a field.
	FS = "( *#.*| +; +)"
}

# $1 is a hexadecimal code point or a "lo..hi" range, $2 the property value.
# The match is anchored so only an exact single-letter value is accepted.
$2 ~ /^[UCDRLT]$/ {
	n = split($1, a, /\.\./)
	lo = strtonum("0X" a[1])
	hi = strtonum("0X" a[n])

	for (i = lo; i <= hi; i++)
		props[i] = $2
}

END {
	for (i = 0; i <= 0x10FFFF; i++) {
		# Membership is tested with "in" because merely reading
		# props[i] would create an empty element for every unlisted
		# code point.
		if (!(i in props))
			continue
		lo = i
		# Extend the run while the next code point has the same value.
		while (((i + 1) in props) && props[i + 1] == props[lo])
			i++
		printf("\t{RUNE_C(0x%06X), RUNE_C(0x%06X), JT_%s},\n", lo, i, props[lo])
	}
}
' /tmp/librune/rtype/DerivedJoiningType.txt

# Close the range table and the include guard: three output lines, the
# middle one empty.
printf '%s\n' \
	'};' \
	'' \
	'#endif /* !RUNE_INTERNAL_RTYPE_JT_H */'