diff options
author | Thomas Voss <mail@thomasvoss.com> | 2024-04-22 21:27:07 +0200 |
---|---|---|
committer | Thomas Voss <mail@thomasvoss.com> | 2024-04-22 21:27:07 +0200 |
commit | eda8550f79f7f836a78f5909f1dccc008511d4f8 (patch) | |
tree | e2f801d7489a6eebeae92fef7b6b95c504668e44 /test/gen-test-data | |
parent | c0a983a29af17415ef29058d72f1a9cd99ddd83f (diff) |
Add a test for word breaking
Diffstat (limited to 'test/gen-test-data')
-rwxr-xr-x | test/gen-test-data | 11 |
1 files changed, 11 insertions, 0 deletions
diff --git a/test/gen-test-data b/test/gen-test-data
new file mode 100755
index 0000000..12ee11e
--- /dev/null
+++ b/test/gen-test-data
@@ -0,0 +1,11 @@
+#!/bin/sh
+
+set -e
+
+download()
+{
+	curl -sS "https://www.unicode.org/Public/15.1.0/ucd/$1"
+}
+
+download 'auxiliary/WordBreakTest.txt' \
+| sed -En 's/\s+//g; s/÷?#.*//g; /./p' >wnext.in