aboutsummaryrefslogtreecommitdiff
path: root/test/_norm-test.h
blob: e4da60973a7171bcb4be1b1fb0d8ba68e4d09602 (plain) (blame)
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
62
63
64
65
66
67
68
69
70
71
72
73
74
75
76
77
78
79
80
81
82
83
84
85
86
87
88
89
90
91
92
93
94
95
96
97
98
99
100
101
102
103
104
105
106
/*
 * This file is a test template: the including translation unit (or the
 * build command line) must define NORMTYPE before this point.  Below, the
 * macro is passed as the final argument to ucsnorm() and is also
 * stringified and compared against "NF_NFC", "NF_NFD", "NF_NFKC" and
 * "NF_NFKD" to pick the expected-result column.
 */
#if !defined(NORMTYPE)
#	error "NORMTYPE must be defined"
#endif

#define _GNU_SOURCE
#include <stdio.h>
#include <stdlib.h>

#include <alloc.h>
#include <array.h>
#include <errors.h>
#include <macros.h>
#include <mbstring.h>
#include <rune.h>
#include <unicode/string.h>

/* Path of the test-case file opened by main(); it is a relative path, so it
   is resolved against the process's current working directory. */
#define TESTFILE "norm.in"

/* Runs a single test case: first argument is one line of TESTFILE (without
   its trailing newline), second is the 1-based case number used in
   diagnostics.  Returns true when the case passes. */
static bool test(u8view_t, int);

/*
 * Test driver.  Opens TESTFILE, hands every line (with its trailing newline
 * removed) to test() together with a 1-based case number, and exits with
 * EXIT_FAILURE if at least one case failed, EXIT_SUCCESS otherwise.
 *
 * Failure to open or read TESTFILE is reported through err(), which is
 * presumably fatal (the code following the fopen() check relies on fp being
 * valid) — confirm against errors.h.
 */
int
main(int, char **argv)
{
	int rv = EXIT_SUCCESS;
	FILE *fp;
	ssize_t nr;

	/* Hand getline() a well-defined (null, 0) buffer/capacity pair so that
	   it allocates the line buffer itself; the capacity must not be left
	   indeterminate. */
	char *line = nullptr;
	size_t n = 0;

	mlib_setprogname(argv[0]);

	if ((fp = fopen(TESTFILE, "r")) == nullptr)
		err("fopen: %s:", TESTFILE);

	for (int id = 1; (nr = getline(&line, &n, fp)) > 0; id++) {
		/* Strip the line terminator; the final line of the file may
		   legitimately lack one. */
		if (line[nr - 1] == '\n')
			line[--nr] = '\0';

		/* Keep going after a failed case so that every failure in the
		   file gets reported in one run. */
		if (!test((u8view_t){line, (size_t)nr}, id))
			rv = EXIT_FAILURE;
	}

	/* getline() returns -1 both at end-of-file and on error; tell the two
	   apart here. */
	if (ferror(fp))
		err("getline: %s:", TESTFILE);

	free(line);
	fclose(fp);
	return rv;
}

/*
 * Run one normalization test case.
 *
 * sv is a single line of the test file: ‘;’-terminated columns, each column
 * being a space-separated list of hexadecimal code points.  Only columns
 * that are followed by a ‘;’ are picked up, so the last column needs a
 * trailing separator.  The code point tokens are parsed with sscanf()
 * directly out of the view, which relies on the byte after each token being
 * a non-hex character or NUL; main() satisfies this by passing a
 * NUL-terminated getline() buffer.
 *
 * Each of the first five columns (c1–c5) is normalized with NORMTYPE and
 * compared against the column that is expected to hold the result:
 *
 *     NORMTYPE   c1–c3 must yield   c4–c5 must yield
 *     NF_NFC     c2                 c4
 *     NF_NFD     c3                 c5
 *     NF_NFKC    c4                 c4
 *     NF_NFKD    c5                 c5
 *
 * (This presumably mirrors the invariants of Unicode's NormalizationTest.txt
 * — confirm against the generator of the test file.)
 *
 * id is the case number used in diagnostics.  Returns true if the case
 * passes; on the first mismatch or on malformed input a warning is printed
 * and false is returned.  All memory allocated for the case is released
 * before returning.
 */
bool
test(u8view_t sv, int id)
{
	/* Number of leading columns (c1–c5) every test line must provide */
	enum { NCOLS = 5 };

	/* Zero-based index of the expected-result column for c1–c3
	   (base_head) and for c4–c5 (base_tail).  This depends only on
	   NORMTYPE, so resolve it once instead of on every comparison. */
	size_t base_head, base_tail;
	const char *nt = STR(NORMTYPE);
	if (streq(nt, "NF_NFC")) {
		base_head = 1;
		base_tail = 3;
	} else if (streq(nt, "NF_NFD")) {
		base_head = 2;
		base_tail = 4;
	} else if (streq(nt, "NF_NFKC"))
		base_head = base_tail = 3;
	else if (streq(nt, "NF_NFKD"))
		base_head = base_tail = 4;
	else
		err("invalid NORMTYPE ‘%s’", nt);

	bool rv = true;
	arena_ctx_t ctx = {};
	allocator_t mem = init_arena_allocator(&ctx, nullptr);

	u8view_t column;
	u8view_t *columns = array_new(mem, typeof(*columns), 64);

	/* Convert every column from its textual code point list into the
	   encoded string that it describes. */
	while (ucscut(&column, &sv, U";", 1) != MBEND) {
		char8_t *s = array_new(mem, typeof(*s), 64);

		rune sep;
		u8view_t cp;
		do {
			rune ch;
			sep = ucscut(&cp, &column, U" ", 1);

			/* Reject empty or non-hexadecimal tokens instead of
			   encoding an uninitialized rune.  The explicit length
			   check matters because sscanf() skips leading
			   whitespace and would otherwise read the *next* token
			   when this one is empty. */
			if (cp.len == 0 || sscanf(cp.p, "%" SCNxRUNE, &ch) != 1) {
				warn("case %d: invalid code point ‘%.*s’", id,
				     SV_PRI_ARGS(cp));
				rv = false;
				goto out;
			}

			char8_t buf[U8_LEN_MAX];
			int w = rtoucs(buf, sizeof(buf), ch);
			/* NOTE(review): array_push() below is given &columns
			   whereas array_extend() is given s by value — confirm
			   against array.h that this is the intended calling
			   convention. */
			array_extend(s, buf, w);
		} while (sep != MBEND);

		array_push(&columns, ((u8view_t){s, array_len(s)}));
	}

	/* The comparisons below index columns[0..NCOLS-1]; make sure a short
	   or blank line cannot make them read unset slots. */
	if (array_len(columns) < NCOLS) {
		warn("case %d: expected %d columns but got %zu", id, NCOLS,
		     (size_t)array_len(columns));
		rv = false;
		goto out;
	}

	for (size_t i = 0; i < NCOLS; i++) {
		size_t base = i < 3 ? base_head : base_tail;

		u8view_t normd = {};
		normd.p = ucsnorm(&normd.len, columns[i], mem, NORMTYPE);
		if (!ucseq(columns[base], normd)) {
			warn("case %d: expected c%zu to be ‘%.*s’ but got ‘%.*s’", id,
			     i + 1, SV_PRI_ARGS(columns[base]), SV_PRI_ARGS(normd));
			rv = false;
			goto out;
		}
	}

out:
	deleteall(mem);
	return rv;
}