aboutsummaryrefslogtreecommitdiff
path: root/test/gen-test-data
diff options
context:
space:
mode:
author Thomas Voss <mail@thomasvoss.com> 2024-04-22 21:27:07 +0200
committer Thomas Voss <mail@thomasvoss.com> 2024-04-22 21:27:07 +0200
commit eda8550f79f7f836a78f5909f1dccc008511d4f8 (patch)
tree e2f801d7489a6eebeae92fef7b6b95c504668e44 /test/gen-test-data
parent c0a983a29af17415ef29058d72f1a9cd99ddd83f (diff)
Add a test for word breaking
Diffstat (limited to 'test/gen-test-data')
-rwxr-xr-x test/gen-test-data 11
1 files changed, 11 insertions, 0 deletions
diff --git a/test/gen-test-data b/test/gen-test-data
new file mode 100755
index 0000000..12ee11e
--- /dev/null
+++ b/test/gen-test-data
@@ -0,0 +1,11 @@
+#!/bin/sh
+
+# Generate test input data: fetch a file from the Unicode Character
+# Database with curl, filter it with sed and write the result to wnext.in
+# in the current directory.  Requires network access.
+
+# -e: abort as soon as a command fails.
+# -u: treat expansion of an unset variable as an error.
+set -eu
+
+download()
+{
+ curl -sS "https://www.unicode.org/Public/15.1.0/ucd/$1"
+}
+
+download 'auxiliary/WordBreakTest.txt' \
+| sed -En 's/\s+//g; s/รท?#.*//g; /./p' >wnext.in