aboutsummaryrefslogtreecommitdiff
path: root/gen/prop/gc
blob: 48c6659280b6dc4ac038affa6c29f4c3692aa392 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
#!/bin/sh

# Generator for include/unicode/__gc.h.  Reads data/UnicodeData.txt and writes
# the header through stdout, which is redirected below.

# Abort on the first failing command.
set -e

# Change to the directory two levels above the one containing this script, so
# the relative data/ and include/ paths used below resolve.  dirname(1) is used
# instead of "${0%/*}" because that expansion leaves $0 unchanged when it
# contains no slash (e.g. `sh gc`), which would make the cd target "gc/../..".
cd "$(dirname -- "$0")/../.."

# From here on, everything written to stdout lands in the generated header.
exec >include/unicode/__gc.h

# Emit the start of the generated header: the do-not-edit banner, the opening
# of the include guard, the unicode/prop.h include, and the opening line of the
# __mlib_gc_lat1_lt array initializer.  The heredoc delimiter is unquoted, so
# the shell would expand $ and backquotes in the text; it contains neither.
cat <<C
/* This file is autogenerated by gen/prop/gc; DO NOT EDIT. */

#ifndef MLIB_UNICODE_PROP___GC_H
#define MLIB_UNICODE_PROP___GC_H

#include "unicode/prop.h"

static const enum uprop_gc __mlib_gc_lat1_lt[] = {
C

# Emit the 256 initializers of __mlib_gc_lat1_lt, one per code point in
# 0x00..0xFF, eight per tab-indented row.
#
# Each input record is split on ";": field 1 is the code point in hex, field 2
# the name, field 3 the general category, which is upper-cased and prefixed
# with "GC_" to form the emitted identifier.  A record whose name matches
# /First/ opens a range whose upper bound is field 1 of the following record.
#
# The row layout is produced inside gawk rather than by piping through paste
# and sed: under `set -e` only the last command of a pipeline is checked, so a
# gawk failure used to go unnoticed.  Records above 0xFF are skipped because
# only 0x00..0xFF is ever printed.
gawk '
BEGIN {
	FS = ";"
}

{
	lo = strtonum("0X" $1)

	# Nothing above 0xFF is printed, so there is no point in storing it.
	if (lo > 0xFF)
		next

	# Must be taken before getline below replaces the current record.
	s = "GC_" toupper($3)

	if ($2 ~ /First/) {
		getline
		hi = strtonum("0X" $1)
		if (hi > 0xFF)
			hi = 0xFF
	} else
		hi = lo

	for (i = lo; i <= hi; i++)
		props[i] = s
}

END {
	# Tab before the first entry of a row, space between entries, newline
	# after the eighth; every entry is followed by a comma.
	for (i = 0; i <= 0xFF; i++)
		printf "%s%s,%s", (i % 8 ? "" : "\t"), props[i], (i % 8 == 7 ? "\n" : " ")
}
' data/UnicodeData.txt

# Close the initializer of the preceding array and open the __mlib_gc_lt table:
# an array of anonymous structs, each holding two runes (lo, hi) and an
# enum uprop_gc value.
cat <<C
};

static const struct {
	rune lo, hi;
	enum uprop_gc val;
} __mlib_gc_lt[] = {
C

# Emit the rows of __mlib_gc_lt: one {lo, hi, category} entry per maximal run
# of consecutive code points in 0x100..0x10FFFF that share a category.  Code
# points absent from the data file produce no row.
#
# Input parsing: fields are split on ";"; field 1 is the code point in hex,
# field 3 the general category (upper-cased and prefixed with "GC_").  A record
# whose name field matches /First/ opens a range whose upper bound is field 1
# of the following record.
#
# Rows are generated in ascending code point order with fixed-width uppercase
# hex, so no sort pass is needed.  Leaving gawk as the only command also lets
# `set -e` see a gawk failure, which a trailing pipeline stage would hide.
gawk '
BEGIN {
	FS = ";"
}

{
	# Must be taken before getline below replaces the current record.
	s = "GC_" toupper($3)
	lo = strtonum("0X" $1)

	if ($2 ~ /First/) {
		getline
		hi = strtonum("0X" $1)
	} else
		hi = lo

	for (i = lo; i <= hi; i++)
		props[i] = s
}

END {
	for (i = 0x100; i <= 0x10FFFF; i++) {
		# Membership test instead of a value lookup: referencing
		# props[i] would create an empty element for every gap.
		if (!(i in props))
			continue
		lo = i
		# Extend the run while the next code point has the same category.
		while (((i + 1) in props) && (props[i + 1] == props[lo]))
			i++
		printf "\t{RUNE_C(0x%06X), RUNE_C(0x%06X), %s},\n", lo, i, props[lo]
	}
}
' data/UnicodeData.txt

# Close the initializer of the preceding table and the include guard opened at
# the top of the generated header.
cat <<C
};

#endif /* !MLIB_UNICODE_PROP___GC_H */
C