aboutsummaryrefslogtreecommitdiff
diff options
context:
space:
mode:
authorThomas Voss <mail@thomasvoss.com> 2024-04-15 14:13:25 +0200
committerThomas Voss <mail@thomasvoss.com> 2024-04-15 14:13:25 +0200
commit6713c56fee21a549ff8a3494bbb52da9234a00aa (patch)
treecb73e39d6b344348dbcbd71cecf0318d644d020f
parentb12a2227b37b79f4bb8cd69143d13c99ad04df96 (diff)
Add uprop_get_sc()
-rw-r--r--data/Scripts3033
-rwxr-xr-xgen/data-files1
-rwxr-xr-xgen/prop/sc232
-rw-r--r--include/unicode/prop.h169
-rw-r--r--lib/unicode/prop/uprop_get_sc.c995
5 files changed, 4430 insertions, 0 deletions
diff --git a/data/Scripts b/data/Scripts
new file mode 100644
index 0000000..0b3f717
--- /dev/null
+++ b/data/Scripts
@@ -0,0 +1,3033 @@
+# Scripts-15.1.0.txt
+# Date: 2023-07-28, 16:01:07 GMT
+# © 2023 Unicode®, Inc.
+# Unicode and the Unicode Logo are registered trademarks of Unicode, Inc. in the U.S. and other countries.
+# For terms of use, see https://www.unicode.org/terms_of_use.html
+#
+# Unicode Character Database
+# For documentation, see https://www.unicode.org/reports/tr44/
+# For more information, see:
+# UAX #24, Unicode Script Property: https://www.unicode.org/reports/tr24/
+# Especially the sections:
+# https://www.unicode.org/reports/tr24/#Assignment_Script_Values
+# https://www.unicode.org/reports/tr24/#Assignment_ScriptX_Values
+#
+
+# ================================================
+
+# Property: Script
+
+# All code points not explicitly listed for Script
+# have the value Unknown (Zzzz).
+
+# @missing: 0000..10FFFF; Unknown
+
+# ================================================
+
+0000..001F ; Common # Cc [32] <control-0000>..<control-001F>
+0020 ; Common # Zs SPACE
+0021..0023 ; Common # Po [3] EXCLAMATION MARK..NUMBER SIGN
+0024 ; Common # Sc DOLLAR SIGN
+0025..0027 ; Common # Po [3] PERCENT SIGN..APOSTROPHE
+0028 ; Common # Ps LEFT PARENTHESIS
+0029 ; Common # Pe RIGHT PARENTHESIS
+002A ; Common # Po ASTERISK
+002B ; Common # Sm PLUS SIGN
+002C ; Common # Po COMMA
+002D ; Common # Pd HYPHEN-MINUS
+002E..002F ; Common # Po [2] FULL STOP..SOLIDUS
+0030..0039 ; Common # Nd [10] DIGIT ZERO..DIGIT NINE
+003A..003B ; Common # Po [2] COLON..SEMICOLON
+003C..003E ; Common # Sm [3] LESS-THAN SIGN..GREATER-THAN SIGN
+003F..0040 ; Common # Po [2] QUESTION MARK..COMMERCIAL AT
+005B ; Common # Ps LEFT SQUARE BRACKET
+005C ; Common # Po REVERSE SOLIDUS
+005D ; Common # Pe RIGHT SQUARE BRACKET
+005E ; Common # Sk CIRCUMFLEX ACCENT
+005F ; Common # Pc LOW LINE
+0060 ; Common # Sk GRAVE ACCENT
+007B ; Common # Ps LEFT CURLY BRACKET
+007C ; Common # Sm VERTICAL LINE
+007D ; Common # Pe RIGHT CURLY BRACKET
+007E ; Common # Sm TILDE
+007F..009F ; Common # Cc [33] <control-007F>..<control-009F>
+00A0 ; Common # Zs NO-BREAK SPACE
+00A1 ; Common # Po INVERTED EXCLAMATION MARK
+00A2..00A5 ; Common # Sc [4] CENT SIGN..YEN SIGN
+00A6 ; Common # So BROKEN BAR
+00A7 ; Common # Po SECTION SIGN
+00A8 ; Common # Sk DIAERESIS
+00A9 ; Common # So COPYRIGHT SIGN
+00AB ; Common # Pi LEFT-POINTING DOUBLE ANGLE QUOTATION MARK
+00AC ; Common # Sm NOT SIGN
+00AD ; Common # Cf SOFT HYPHEN
+00AE ; Common # So REGISTERED SIGN
+00AF ; Common # Sk MACRON
+00B0 ; Common # So DEGREE SIGN
+00B1 ; Common # Sm PLUS-MINUS SIGN
+00B2..00B3 ; Common # No [2] SUPERSCRIPT TWO..SUPERSCRIPT THREE
+00B4 ; Common # Sk ACUTE ACCENT
+00B5 ; Common # L& MICRO SIGN
+00B6..00B7 ; Common # Po [2] PILCROW SIGN..MIDDLE DOT
+00B8 ; Common # Sk CEDILLA
+00B9 ; Common # No SUPERSCRIPT ONE
+00BB ; Common # Pf RIGHT-POINTING DOUBLE ANGLE QUOTATION MARK
+00BC..00BE ; Common # No [3] VULGAR FRACTION ONE QUARTER..VULGAR FRACTION THREE QUARTERS
+00BF ; Common # Po INVERTED QUESTION MARK
+00D7 ; Common # Sm MULTIPLICATION SIGN
+00F7 ; Common # Sm DIVISION SIGN
+02B9..02C1 ; Common # Lm [9] MODIFIER LETTER PRIME..MODIFIER LETTER REVERSED GLOTTAL STOP
+02C2..02C5 ; Common # Sk [4] MODIFIER LETTER LEFT ARROWHEAD..MODIFIER LETTER DOWN ARROWHEAD
+02C6..02D1 ; Common # Lm [12] MODIFIER LETTER CIRCUMFLEX ACCENT..MODIFIER LETTER HALF TRIANGULAR COLON
+02D2..02DF ; Common # Sk [14] MODIFIER LETTER CENTRED RIGHT HALF RING..MODIFIER LETTER CROSS ACCENT
+02E5..02E9 ; Common # Sk [5] MODIFIER LETTER EXTRA-HIGH TONE BAR..MODIFIER LETTER EXTRA-LOW TONE BAR
+02EC ; Common # Lm MODIFIER LETTER VOICING
+02ED ; Common # Sk MODIFIER LETTER UNASPIRATED
+02EE ; Common # Lm MODIFIER LETTER DOUBLE APOSTROPHE
+02EF..02FF ; Common # Sk [17] MODIFIER LETTER LOW DOWN ARROWHEAD..MODIFIER LETTER LOW LEFT ARROW
+0374 ; Common # Lm GREEK NUMERAL SIGN
+037E ; Common # Po GREEK QUESTION MARK
+0385 ; Common # Sk GREEK DIALYTIKA TONOS
+0387 ; Common # Po GREEK ANO TELEIA
+0605 ; Common # Cf ARABIC NUMBER MARK ABOVE
+060C ; Common # Po ARABIC COMMA
+061B ; Common # Po ARABIC SEMICOLON
+061F ; Common # Po ARABIC QUESTION MARK
+0640 ; Common # Lm ARABIC TATWEEL
+06DD ; Common # Cf ARABIC END OF AYAH
+08E2 ; Common # Cf ARABIC DISPUTED END OF AYAH
+0964..0965 ; Common # Po [2] DEVANAGARI DANDA..DEVANAGARI DOUBLE DANDA
+0E3F ; Common # Sc THAI CURRENCY SYMBOL BAHT
+0FD5..0FD8 ; Common # So [4] RIGHT-FACING SVASTI SIGN..LEFT-FACING SVASTI SIGN WITH DOTS
+10FB ; Common # Po GEORGIAN PARAGRAPH SEPARATOR
+16EB..16ED ; Common # Po [3] RUNIC SINGLE PUNCTUATION..RUNIC CROSS PUNCTUATION
+1735..1736 ; Common # Po [2] PHILIPPINE SINGLE PUNCTUATION..PHILIPPINE DOUBLE PUNCTUATION
+1802..1803 ; Common # Po [2] MONGOLIAN COMMA..MONGOLIAN FULL STOP
+1805 ; Common # Po MONGOLIAN FOUR DOTS
+1CD3 ; Common # Po VEDIC SIGN NIHSHVASA
+1CE1 ; Common # Mc VEDIC TONE ATHARVAVEDIC INDEPENDENT SVARITA
+1CE9..1CEC ; Common # Lo [4] VEDIC SIGN ANUSVARA ANTARGOMUKHA..VEDIC SIGN ANUSVARA VAMAGOMUKHA WITH TAIL
+1CEE..1CF3 ; Common # Lo [6] VEDIC SIGN HEXIFORM LONG ANUSVARA..VEDIC SIGN ROTATED ARDHAVISARGA
+1CF5..1CF6 ; Common # Lo [2] VEDIC SIGN JIHVAMULIYA..VEDIC SIGN UPADHMANIYA
+1CF7 ; Common # Mc VEDIC SIGN ATIKRAMA
+1CFA ; Common # Lo VEDIC SIGN DOUBLE ANUSVARA ANTARGOMUKHA
+2000..200A ; Common # Zs [11] EN QUAD..HAIR SPACE
+200B ; Common # Cf ZERO WIDTH SPACE
+200E..200F ; Common # Cf [2] LEFT-TO-RIGHT MARK..RIGHT-TO-LEFT MARK
+2010..2015 ; Common # Pd [6] HYPHEN..HORIZONTAL BAR
+2016..2017 ; Common # Po [2] DOUBLE VERTICAL LINE..DOUBLE LOW LINE
+2018 ; Common # Pi LEFT SINGLE QUOTATION MARK
+2019 ; Common # Pf RIGHT SINGLE QUOTATION MARK
+201A ; Common # Ps SINGLE LOW-9 QUOTATION MARK
+201B..201C ; Common # Pi [2] SINGLE HIGH-REVERSED-9 QUOTATION MARK..LEFT DOUBLE QUOTATION MARK
+201D ; Common # Pf RIGHT DOUBLE QUOTATION MARK
+201E ; Common # Ps DOUBLE LOW-9 QUOTATION MARK
+201F ; Common # Pi DOUBLE HIGH-REVERSED-9 QUOTATION MARK
+2020..2027 ; Common # Po [8] DAGGER..HYPHENATION POINT
+2028 ; Common # Zl LINE SEPARATOR
+2029 ; Common # Zp PARAGRAPH SEPARATOR
+202A..202E ; Common # Cf [5] LEFT-TO-RIGHT EMBEDDING..RIGHT-TO-LEFT OVERRIDE
+202F ; Common # Zs NARROW NO-BREAK SPACE
+2030..2038 ; Common # Po [9] PER MILLE SIGN..CARET
+2039 ; Common # Pi SINGLE LEFT-POINTING ANGLE QUOTATION MARK
+203A ; Common # Pf SINGLE RIGHT-POINTING ANGLE QUOTATION MARK
+203B..203E ; Common # Po [4] REFERENCE MARK..OVERLINE
+203F..2040 ; Common # Pc [2] UNDERTIE..CHARACTER TIE
+2041..2043 ; Common # Po [3] CARET INSERTION POINT..HYPHEN BULLET
+2044 ; Common # Sm FRACTION SLASH
+2045 ; Common # Ps LEFT SQUARE BRACKET WITH QUILL
+2046 ; Common # Pe RIGHT SQUARE BRACKET WITH QUILL
+2047..2051 ; Common # Po [11] DOUBLE QUESTION MARK..TWO ASTERISKS ALIGNED VERTICALLY
+2052 ; Common # Sm COMMERCIAL MINUS SIGN
+2053 ; Common # Po SWUNG DASH
+2054 ; Common # Pc INVERTED UNDERTIE
+2055..205E ; Common # Po [10] FLOWER PUNCTUATION MARK..VERTICAL FOUR DOTS
+205F ; Common # Zs MEDIUM MATHEMATICAL SPACE
+2060..2064 ; Common # Cf [5] WORD JOINER..INVISIBLE PLUS
+2066..206F ; Common # Cf [10] LEFT-TO-RIGHT ISOLATE..NOMINAL DIGIT SHAPES
+2070 ; Common # No SUPERSCRIPT ZERO
+2074..2079 ; Common # No [6] SUPERSCRIPT FOUR..SUPERSCRIPT NINE
+207A..207C ; Common # Sm [3] SUPERSCRIPT PLUS SIGN..SUPERSCRIPT EQUALS SIGN
+207D ; Common # Ps SUPERSCRIPT LEFT PARENTHESIS
+207E ; Common # Pe SUPERSCRIPT RIGHT PARENTHESIS
+2080..2089 ; Common # No [10] SUBSCRIPT ZERO..SUBSCRIPT NINE
+208A..208C ; Common # Sm [3] SUBSCRIPT PLUS SIGN..SUBSCRIPT EQUALS SIGN
+208D ; Common # Ps SUBSCRIPT LEFT PARENTHESIS
+208E ; Common # Pe SUBSCRIPT RIGHT PARENTHESIS
+20A0..20C0 ; Common # Sc [33] EURO-CURRENCY SIGN..SOM SIGN
+2100..2101 ; Common # So [2] ACCOUNT OF..ADDRESSED TO THE SUBJECT
+2102 ; Common # L& DOUBLE-STRUCK CAPITAL C
+2103..2106 ; Common # So [4] DEGREE CELSIUS..CADA UNA
+2107 ; Common # L& EULER CONSTANT
+2108..2109 ; Common # So [2] SCRUPLE..DEGREE FAHRENHEIT
+210A..2113 ; Common # L& [10] SCRIPT SMALL G..SCRIPT SMALL L
+2114 ; Common # So L B BAR SYMBOL
+2115 ; Common # L& DOUBLE-STRUCK CAPITAL N
+2116..2117 ; Common # So [2] NUMERO SIGN..SOUND RECORDING COPYRIGHT
+2118 ; Common # Sm SCRIPT CAPITAL P
+2119..211D ; Common # L& [5] DOUBLE-STRUCK CAPITAL P..DOUBLE-STRUCK CAPITAL R
+211E..2123 ; Common # So [6] PRESCRIPTION TAKE..VERSICLE
+2124 ; Common # L& DOUBLE-STRUCK CAPITAL Z
+2125 ; Common # So OUNCE SIGN
+2127 ; Common # So INVERTED OHM SIGN
+2128 ; Common # L& BLACK-LETTER CAPITAL Z
+2129 ; Common # So TURNED GREEK SMALL LETTER IOTA
+212C..212D ; Common # L& [2] SCRIPT CAPITAL B..BLACK-LETTER CAPITAL C
+212E ; Common # So ESTIMATED SYMBOL
+212F..2131 ; Common # L& [3] SCRIPT SMALL E..SCRIPT CAPITAL F
+2133..2134 ; Common # L& [2] SCRIPT CAPITAL M..SCRIPT SMALL O
+2135..2138 ; Common # Lo [4] ALEF SYMBOL..DALET SYMBOL
+2139 ; Common # L& INFORMATION SOURCE
+213A..213B ; Common # So [2] ROTATED CAPITAL Q..FACSIMILE SIGN
+213C..213F ; Common # L& [4] DOUBLE-STRUCK SMALL PI..DOUBLE-STRUCK CAPITAL PI
+2140..2144 ; Common # Sm [5] DOUBLE-STRUCK N-ARY SUMMATION..TURNED SANS-SERIF CAPITAL Y
+2145..2149 ; Common # L& [5] DOUBLE-STRUCK ITALIC CAPITAL D..DOUBLE-STRUCK ITALIC SMALL J
+214A ; Common # So PROPERTY LINE
+214B ; Common # Sm TURNED AMPERSAND
+214C..214D ; Common # So [2] PER SIGN..AKTIESELSKAB
+214F ; Common # So SYMBOL FOR SAMARITAN SOURCE
+2150..215F ; Common # No [16] VULGAR FRACTION ONE SEVENTH..FRACTION NUMERATOR ONE
+2189 ; Common # No VULGAR FRACTION ZERO THIRDS
+218A..218B ; Common # So [2] TURNED DIGIT TWO..TURNED DIGIT THREE
+2190..2194 ; Common # Sm [5] LEFTWARDS ARROW..LEFT RIGHT ARROW
+2195..2199 ; Common # So [5] UP DOWN ARROW..SOUTH WEST ARROW
+219A..219B ; Common # Sm [2] LEFTWARDS ARROW WITH STROKE..RIGHTWARDS ARROW WITH STROKE
+219C..219F ; Common # So [4] LEFTWARDS WAVE ARROW..UPWARDS TWO HEADED ARROW
+21A0 ; Common # Sm RIGHTWARDS TWO HEADED ARROW
+21A1..21A2 ; Common # So [2] DOWNWARDS TWO HEADED ARROW..LEFTWARDS ARROW WITH TAIL
+21A3 ; Common # Sm RIGHTWARDS ARROW WITH TAIL
+21A4..21A5 ; Common # So [2] LEFTWARDS ARROW FROM BAR..UPWARDS ARROW FROM BAR
+21A6 ; Common # Sm RIGHTWARDS ARROW FROM BAR
+21A7..21AD ; Common # So [7] DOWNWARDS ARROW FROM BAR..LEFT RIGHT WAVE ARROW
+21AE ; Common # Sm LEFT RIGHT ARROW WITH STROKE
+21AF..21CD ; Common # So [31] DOWNWARDS ZIGZAG ARROW..LEFTWARDS DOUBLE ARROW WITH STROKE
+21CE..21CF ; Common # Sm [2] LEFT RIGHT DOUBLE ARROW WITH STROKE..RIGHTWARDS DOUBLE ARROW WITH STROKE
+21D0..21D1 ; Common # So [2] LEFTWARDS DOUBLE ARROW..UPWARDS DOUBLE ARROW
+21D2 ; Common # Sm RIGHTWARDS DOUBLE ARROW
+21D3 ; Common # So DOWNWARDS DOUBLE ARROW
+21D4 ; Common # Sm LEFT RIGHT DOUBLE ARROW
+21D5..21F3 ; Common # So [31] UP DOWN DOUBLE ARROW..UP DOWN WHITE ARROW
+21F4..22FF ; Common # Sm [268] RIGHT ARROW WITH SMALL CIRCLE..Z NOTATION BAG MEMBERSHIP
+2300..2307 ; Common # So [8] DIAMETER SIGN..WAVY LINE
+2308 ; Common # Ps LEFT CEILING
+2309 ; Common # Pe RIGHT CEILING
+230A ; Common # Ps LEFT FLOOR
+230B ; Common # Pe RIGHT FLOOR
+230C..231F ; Common # So [20] BOTTOM RIGHT CROP..BOTTOM RIGHT CORNER
+2320..2321 ; Common # Sm [2] TOP HALF INTEGRAL..BOTTOM HALF INTEGRAL
+2322..2328 ; Common # So [7] FROWN..KEYBOARD
+2329 ; Common # Ps LEFT-POINTING ANGLE BRACKET
+232A ; Common # Pe RIGHT-POINTING ANGLE BRACKET
+232B..237B ; Common # So [81] ERASE TO THE LEFT..NOT CHECK MARK
+237C ; Common # Sm RIGHT ANGLE WITH DOWNWARDS ZIGZAG ARROW
+237D..239A ; Common # So [30] SHOULDERED OPEN BOX..CLEAR SCREEN SYMBOL
+239B..23B3 ; Common # Sm [25] LEFT PARENTHESIS UPPER HOOK..SUMMATION BOTTOM
+23B4..23DB ; Common # So [40] TOP SQUARE BRACKET..FUSE
+23DC..23E1 ; Common # Sm [6] TOP PARENTHESIS..BOTTOM TORTOISE SHELL BRACKET
+23E2..2426 ; Common # So [69] WHITE TRAPEZIUM..SYMBOL FOR SUBSTITUTE FORM TWO
+2440..244A ; Common # So [11] OCR HOOK..OCR DOUBLE BACKSLASH
+2460..249B ; Common # No [60] CIRCLED DIGIT ONE..NUMBER TWENTY FULL STOP
+249C..24E9 ; Common # So [78] PARENTHESIZED LATIN SMALL LETTER A..CIRCLED LATIN SMALL LETTER Z
+24EA..24FF ; Common # No [22] CIRCLED DIGIT ZERO..NEGATIVE CIRCLED DIGIT ZERO
+2500..25B6 ; Common # So [183] BOX DRAWINGS LIGHT HORIZONTAL..BLACK RIGHT-POINTING TRIANGLE
+25B7 ; Common # Sm WHITE RIGHT-POINTING TRIANGLE
+25B8..25C0 ; Common # So [9] BLACK RIGHT-POINTING SMALL TRIANGLE..BLACK LEFT-POINTING TRIANGLE
+25C1 ; Common # Sm WHITE LEFT-POINTING TRIANGLE
+25C2..25F7 ; Common # So [54] BLACK LEFT-POINTING SMALL TRIANGLE..WHITE CIRCLE WITH UPPER RIGHT QUADRANT
+25F8..25FF ; Common # Sm [8] UPPER LEFT TRIANGLE..LOWER RIGHT TRIANGLE
+2600..266E ; Common # So [111] BLACK SUN WITH RAYS..MUSIC NATURAL SIGN
+266F ; Common # Sm MUSIC SHARP SIGN
+2670..2767 ; Common # So [248] WEST SYRIAC CROSS..ROTATED FLORAL HEART BULLET
+2768 ; Common # Ps MEDIUM LEFT PARENTHESIS ORNAMENT
+2769 ; Common # Pe MEDIUM RIGHT PARENTHESIS ORNAMENT
+276A ; Common # Ps MEDIUM FLATTENED LEFT PARENTHESIS ORNAMENT
+276B ; Common # Pe MEDIUM FLATTENED RIGHT PARENTHESIS ORNAMENT
+276C ; Common # Ps MEDIUM LEFT-POINTING ANGLE BRACKET ORNAMENT
+276D ; Common # Pe MEDIUM RIGHT-POINTING ANGLE BRACKET ORNAMENT
+276E ; Common # Ps HEAVY LEFT-POINTING ANGLE QUOTATION MARK ORNAMENT
+276F ; Common # Pe HEAVY RIGHT-POINTING ANGLE QUOTATION MARK ORNAMENT
+2770 ; Common # Ps HEAVY LEFT-POINTING ANGLE BRACKET ORNAMENT
+2771 ; Common # Pe HEAVY RIGHT-POINTING ANGLE BRACKET ORNAMENT
+2772 ; Common # Ps LIGHT LEFT TORTOISE SHELL BRACKET ORNAMENT
+2773 ; Common # Pe LIGHT RIGHT TORTOISE SHELL BRACKET ORNAMENT
+2774 ; Common # Ps MEDIUM LEFT CURLY BRACKET ORNAMENT
+2775 ; Common # Pe MEDIUM RIGHT CURLY BRACKET ORNAMENT
+2776..2793 ; Common # No [30] DINGBAT NEGATIVE CIRCLED DIGIT ONE..DINGBAT NEGATIVE CIRCLED SANS-SERIF NUMBER TEN
+2794..27BF ; Common # So [44] HEAVY WIDE-HEADED RIGHTWARDS ARROW..DOUBLE CURLY LOOP
+27C0..27C4 ; Common # Sm [5] THREE DIMENSIONAL ANGLE..OPEN SUPERSET
+27C5 ; Common # Ps LEFT S-SHAPED BAG DELIMITER
+27C6 ; Common # Pe RIGHT S-SHAPED BAG DELIMITER
+27C7..27E5 ; Common # Sm [31] OR WITH DOT INSIDE..WHITE SQUARE WITH RIGHTWARDS TICK
+27E6 ; Common # Ps MATHEMATICAL LEFT WHITE SQUARE BRACKET
+27E7 ; Common # Pe MATHEMATICAL RIGHT WHITE SQUARE BRACKET
+27E8 ; Common # Ps MATHEMATICAL LEFT ANGLE BRACKET
+27E9 ; Common # Pe MATHEMATICAL RIGHT ANGLE BRACKET
+27EA ; Common # Ps MATHEMATICAL LEFT DOUBLE ANGLE BRACKET
+27EB ; Common # Pe MATHEMATICAL RIGHT DOUBLE ANGLE BRACKET
+27EC ; Common # Ps MATHEMATICAL LEFT WHITE TORTOISE SHELL BRACKET
+27ED ; Common # Pe MATHEMATICAL RIGHT WHITE TORTOISE SHELL BRACKET
+27EE ; Common # Ps MATHEMATICAL LEFT FLATTENED PARENTHESIS
+27EF ; Common # Pe MATHEMATICAL RIGHT FLATTENED PARENTHESIS
+27F0..27FF ; Common # Sm [16] UPWARDS QUADRUPLE ARROW..LONG RIGHTWARDS SQUIGGLE ARROW
+2900..2982 ; Common # Sm [131] RIGHTWARDS TWO-HEADED ARROW WITH VERTICAL STROKE..Z NOTATION TYPE COLON
+2983 ; Common # Ps LEFT WHITE CURLY BRACKET
+2984 ; Common # Pe RIGHT WHITE CURLY BRACKET
+2985 ; Common # Ps LEFT WHITE PARENTHESIS
+2986 ; Common # Pe RIGHT WHITE PARENTHESIS
+2987 ; Common # Ps Z NOTATION LEFT IMAGE BRACKET
+2988 ; Common # Pe Z NOTATION RIGHT IMAGE BRACKET
+2989 ; Common # Ps Z NOTATION LEFT BINDING BRACKET
+298A ; Common # Pe Z NOTATION RIGHT BINDING BRACKET
+298B ; Common # Ps LEFT SQUARE BRACKET WITH UNDERBAR
+298C ; Common # Pe RIGHT SQUARE BRACKET WITH UNDERBAR
+298D ; Common # Ps LEFT SQUARE BRACKET WITH TICK IN TOP CORNER
+298E ; Common # Pe RIGHT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
+298F ; Common # Ps LEFT SQUARE BRACKET WITH TICK IN BOTTOM CORNER
+2990 ; Common # Pe RIGHT SQUARE BRACKET WITH TICK IN TOP CORNER
+2991 ; Common # Ps LEFT ANGLE BRACKET WITH DOT
+2992 ; Common # Pe RIGHT ANGLE BRACKET WITH DOT
+2993 ; Common # Ps LEFT ARC LESS-THAN BRACKET
+2994 ; Common # Pe RIGHT ARC GREATER-THAN BRACKET
+2995 ; Common # Ps DOUBLE LEFT ARC GREATER-THAN BRACKET
+2996 ; Common # Pe DOUBLE RIGHT ARC LESS-THAN BRACKET
+2997 ; Common # Ps LEFT BLACK TORTOISE SHELL BRACKET
+2998 ; Common # Pe RIGHT BLACK TORTOISE SHELL BRACKET
+2999..29D7 ; Common # Sm [63] DOTTED FENCE..BLACK HOURGLASS
+29D8 ; Common # Ps LEFT WIGGLY FENCE
+29D9 ; Common # Pe RIGHT WIGGLY FENCE
+29DA ; Common # Ps LEFT DOUBLE WIGGLY FENCE
+29DB ; Common # Pe RIGHT DOUBLE WIGGLY FENCE
+29DC..29FB ; Common # Sm [32] INCOMPLETE INFINITY..TRIPLE PLUS
+29FC ; Common # Ps LEFT-POINTING CURVED ANGLE BRACKET
+29FD ; Common # Pe RIGHT-POINTING CURVED ANGLE BRACKET
+29FE..2AFF ; Common # Sm [258] TINY..N-ARY WHITE VERTICAL BAR
+2B00..2B2F ; Common # So [48] NORTH EAST WHITE ARROW..WHITE VERTICAL ELLIPSE
+2B30..2B44 ; Common # Sm [21] LEFT ARROW WITH SMALL CIRCLE..RIGHTWARDS ARROW THROUGH SUPERSET
+2B45..2B46 ; Common # So [2] LEFTWARDS QUADRUPLE ARROW..RIGHTWARDS QUADRUPLE ARROW
+2B47..2B4C ; Common # Sm [6] REVERSE TILDE OPERATOR ABOVE RIGHTWARDS ARROW..RIGHTWARDS ARROW ABOVE REVERSE TILDE OPERATOR
+2B4D..2B73 ; Common # So [39] DOWNWARDS TRIANGLE-HEADED ZIGZAG ARROW..DOWNWARDS TRIANGLE-HEADED ARROW TO BAR
+2B76..2B95 ; Common # So [32] NORTH WEST TRIANGLE-HEADED ARROW TO BAR..RIGHTWARDS BLACK ARROW
+2B97..2BFF ; Common # So [105] SYMBOL FOR TYPE A ELECTRONICS..HELLSCHREIBER PAUSE SYMBOL
+2E00..2E01 ; Common # Po [2] RIGHT ANGLE SUBSTITUTION MARKER..RIGHT ANGLE DOTTED SUBSTITUTION MARKER
+2E02 ; Common # Pi LEFT SUBSTITUTION BRACKET
+2E03 ; Common # Pf RIGHT SUBSTITUTION BRACKET
+2E04 ; Common # Pi LEFT DOTTED SUBSTITUTION BRACKET
+2E05 ; Common # Pf RIGHT DOTTED SUBSTITUTION BRACKET
+2E06..2E08 ; Common # Po [3] RAISED INTERPOLATION MARKER..DOTTED TRANSPOSITION MARKER
+2E09 ; Common # Pi LEFT TRANSPOSITION BRACKET
+2E0A ; Common # Pf RIGHT TRANSPOSITION BRACKET
+2E0B ; Common # Po RAISED SQUARE
+2E0C ; Common # Pi LEFT RAISED OMISSION BRACKET
+2E0D ; Common # Pf RIGHT RAISED OMISSION BRACKET
+2E0E..2E16 ; Common # Po [9] EDITORIAL CORONIS..DOTTED RIGHT-POINTING ANGLE
+2E17 ; Common # Pd DOUBLE OBLIQUE HYPHEN
+2E18..2E19 ; Common # Po [2] INVERTED INTERROBANG..PALM BRANCH
+2E1A ; Common # Pd HYPHEN WITH DIAERESIS
+2E1B ; Common # Po TILDE WITH RING ABOVE
+2E1C ; Common # Pi LEFT LOW PARAPHRASE BRACKET
+2E1D ; Common # Pf RIGHT LOW PARAPHRASE BRACKET
+2E1E..2E1F ; Common # Po [2] TILDE WITH DOT ABOVE..TILDE WITH DOT BELOW
+2E20 ; Common # Pi LEFT VERTICAL BAR WITH QUILL
+2E21 ; Common # Pf RIGHT VERTICAL BAR WITH QUILL
+2E22 ; Common # Ps TOP LEFT HALF BRACKET
+2E23 ; Common # Pe TOP RIGHT HALF BRACKET
+2E24 ; Common # Ps BOTTOM LEFT HALF BRACKET
+2E25 ; Common # Pe BOTTOM RIGHT HALF BRACKET
+2E26 ; Common # Ps LEFT SIDEWAYS U BRACKET
+2E27 ; Common # Pe RIGHT SIDEWAYS U BRACKET
+2E28 ; Common # Ps LEFT DOUBLE PARENTHESIS
+2E29 ; Common # Pe RIGHT DOUBLE PARENTHESIS
+2E2A..2E2E ; Common # Po [5] TWO DOTS OVER ONE DOT PUNCTUATION..REVERSED QUESTION MARK
+2E2F ; Common # Lm VERTICAL TILDE
+2E30..2E39 ; Common # Po [10] RING POINT..TOP HALF SECTION SIGN
+2E3A..2E3B ; Common # Pd [2] TWO-EM DASH..THREE-EM DASH
+2E3C..2E3F ; Common # Po [4] STENOGRAPHIC FULL STOP..CAPITULUM
+2E40 ; Common # Pd DOUBLE HYPHEN
+2E41 ; Common # Po REVERSED COMMA
+2E42 ; Common # Ps DOUBLE LOW-REVERSED-9 QUOTATION MARK
+2E43..2E4F ; Common # Po [13] DASH WITH LEFT UPTURN..CORNISH VERSE DIVIDER
+2E50..2E51 ; Common # So [2] CROSS PATTY WITH RIGHT CROSSBAR..CROSS PATTY WITH LEFT CROSSBAR
+2E52..2E54 ; Common # Po [3] TIRONIAN SIGN CAPITAL ET..MEDIEVAL QUESTION MARK
+2E55 ; Common # Ps LEFT SQUARE BRACKET WITH STROKE
+2E56 ; Common # Pe RIGHT SQUARE BRACKET WITH STROKE
+2E57 ; Common # Ps LEFT SQUARE BRACKET WITH DOUBLE STROKE
+2E58 ; Common # Pe RIGHT SQUARE BRACKET WITH DOUBLE STROKE
+2E59 ; Common # Ps TOP HALF LEFT PARENTHESIS
+2E5A ; Common # Pe TOP HALF RIGHT PARENTHESIS
+2E5B ; Common # Ps BOTTOM HALF LEFT PARENTHESIS
+2E5C ; Common # Pe BOTTOM HALF RIGHT PARENTHESIS
+2E5D ; Common # Pd OBLIQUE HYPHEN
+2FF0..2FFF ; Common # So [16] IDEOGRAPHIC DESCRIPTION CHARACTER LEFT TO RIGHT..IDEOGRAPHIC DESCRIPTION CHARACTER ROTATION
+3000 ; Common # Zs IDEOGRAPHIC SPACE
+3001..3003 ; Common # Po [3] IDEOGRAPHIC COMMA..DITTO MARK
+3004 ; Common # So JAPANESE INDUSTRIAL STANDARD SYMBOL
+3006 ; Common # Lo IDEOGRAPHIC CLOSING MARK
+3008 ; Common # Ps LEFT ANGLE BRACKET
+3009 ; Common # Pe RIGHT ANGLE BRACKET
+300A ; Common # Ps LEFT DOUBLE ANGLE BRACKET
+300B ; Common # Pe RIGHT DOUBLE ANGLE BRACKET
+300C ; Common # Ps LEFT CORNER BRACKET
+300D ; Common # Pe RIGHT CORNER BRACKET
+300E ; Common # Ps LEFT WHITE CORNER BRACKET
+300F ; Common # Pe RIGHT WHITE CORNER BRACKET
+3010 ; Common # Ps LEFT BLACK LENTICULAR BRACKET
+3011 ; Common # Pe RIGHT BLACK LENTICULAR BRACKET
+3012..3013 ; Common # So [2] POSTAL MARK..GETA MARK
+3014 ; Common # Ps LEFT TORTOISE SHELL BRACKET
+3015 ; Common # Pe RIGHT TORTOISE SHELL BRACKET
+3016 ; Common # Ps LEFT WHITE LENTICULAR BRACKET
+3017 ; Common # Pe RIGHT WHITE LENTICULAR BRACKET
+3018 ; Common # Ps LEFT WHITE TORTOISE SHELL BRACKET
+3019 ; Common # Pe RIGHT WHITE TORTOISE SHELL BRACKET
+301A ; Common # Ps LEFT WHITE SQUARE BRACKET
+301B ; Common # Pe RIGHT WHITE SQUARE BRACKET
+301C ; Common # Pd WAVE DASH
+301D ; Common # Ps REVERSED DOUBLE PRIME QUOTATION MARK
+301E..301F ; Common # Pe [2] DOUBLE PRIME QUOTATION MARK..LOW DOUBLE PRIME QUOTATION MARK
+3020 ; Common # So POSTAL MARK FACE
+3030 ; Common # Pd WAVY DASH
+3031..3035 ; Common # Lm [5] VERTICAL KANA REPEAT MARK..VERTICAL KANA REPEAT MARK LOWER HALF
+3036..3037 ; Common # So [2] CIRCLED POSTAL MARK..IDEOGRAPHIC TELEGRAPH LINE FEED SEPARATOR SYMBOL
+303C ; Common # Lo MASU MARK
+303D ; Common # Po PART ALTERNATION MARK
+303E..303F ; Common # So [2] IDEOGRAPHIC VARIATION INDICATOR..IDEOGRAPHIC HALF FILL SPACE
+309B..309C ; Common # Sk [2] KATAKANA-HIRAGANA VOICED SOUND MARK..KATAKANA-HIRAGANA SEMI-VOICED SOUND MARK
+30A0 ; Common # Pd KATAKANA-HIRAGANA DOUBLE HYPHEN
+30FB ; Common # Po KATAKANA MIDDLE DOT
+30FC ; Common # Lm KATAKANA-HIRAGANA PROLONGED SOUND MARK
+3190..3191 ; Common # So [2] IDEOGRAPHIC ANNOTATION LINKING MARK..IDEOGRAPHIC ANNOTATION REVERSE MARK
+3192..3195 ; Common # No [4] IDEOGRAPHIC ANNOTATION ONE MARK..IDEOGRAPHIC ANNOTATION FOUR MARK
+3196..319F ; Common # So [10] IDEOGRAPHIC ANNOTATION TOP MARK..IDEOGRAPHIC ANNOTATION MAN MARK
+31C0..31E3 ; Common # So [36] CJK STROKE T..CJK STROKE Q
+31EF ; Common # So IDEOGRAPHIC DESCRIPTION CHARACTER SUBTRACTION
+3220..3229 ; Common # No [10] PARENTHESIZED IDEOGRAPH ONE..PARENTHESIZED IDEOGRAPH TEN
+322A..3247 ; Common # So [30] PARENTHESIZED IDEOGRAPH MOON..CIRCLED IDEOGRAPH KOTO
+3248..324F ; Common # No [8] CIRCLED NUMBER TEN ON BLACK SQUARE..CIRCLED NUMBER EIGHTY ON BLACK SQUARE
+3250 ; Common # So PARTNERSHIP SIGN
+3251..325F ; Common # No [15] CIRCLED NUMBER TWENTY ONE..CIRCLED NUMBER THIRTY FIVE
+327F ; Common # So KOREAN STANDARD SYMBOL
+3280..3289 ; Common # No [10] CIRCLED IDEOGRAPH ONE..CIRCLED IDEOGRAPH TEN
+328A..32B0 ; Common # So [39] CIRCLED IDEOGRAPH MOON..CIRCLED IDEOGRAPH NIGHT
+32B1..32BF ; Common # No [15] CIRCLED NUMBER THIRTY SIX..CIRCLED NUMBER FIFTY
+32C0..32CF ; Common # So [16] IDEOGRAPHIC TELEGRAPH SYMBOL FOR JANUARY..LIMITED LIABILITY SIGN
+32FF ; Common # So SQUARE ERA NAME REIWA
+3358..33FF ; Common # So [168] IDEOGRAPHIC TELEGRAPH SYMBOL FOR HOUR ZERO..SQUARE GAL
+4DC0..4DFF ; Common # So [64] HEXAGRAM FOR THE CREATIVE HEAVEN..HEXAGRAM FOR BEFORE COMPLETION
+A700..A716 ; Common # Sk [23] MODIFIER LETTER CHINESE TONE YIN PING..MODIFIER LETTER EXTRA-LOW LEFT-STEM TONE BAR
+A717..A71F ; Common # Lm [9] MODIFIER LETTER DOT VERTICAL BAR..MODIFIER LETTER LOW INVERTED EXCLAMATION MARK
+A720..A721 ; Common # Sk [2] MODIFIER LETTER STRESS AND HIGH TONE..MODIFIER LETTER STRESS AND LOW TONE
+A788 ; Common # Lm MODIFIER LETTER LOW CIRCUMFLEX ACCENT
+A789..A78A ; Common # Sk [2] MODIFIER LETTER COLON..MODIFIER LETTER SHORT EQUALS SIGN
+A830..A835 ; Common # No [6] NORTH INDIC FRACTION ONE QUARTER..NORTH INDIC FRACTION THREE SIXTEENTHS
+A836..A837 ; Common # So [2] NORTH INDIC QUARTER MARK..NORTH INDIC PLACEHOLDER MARK
+A838 ; Common # Sc NORTH INDIC RUPEE MARK
+A839 ; Common # So NORTH INDIC QUANTITY MARK
+A92E ; Common # Po KAYAH LI SIGN CWI
+A9CF ; Common # Lm JAVANESE PANGRANGKEP
+AB5B ; Common # Sk MODIFIER BREVE WITH INVERTED BREVE
+AB6A..AB6B ; Common # Sk [2] MODIFIER LETTER LEFT TACK..MODIFIER LETTER RIGHT TACK
+FD3E ; Common # Pe ORNATE LEFT PARENTHESIS
+FD3F ; Common # Ps ORNATE RIGHT PARENTHESIS
+FE10..FE16 ; Common # Po [7] PRESENTATION FORM FOR VERTICAL COMMA..PRESENTATION FORM FOR VERTICAL QUESTION MARK
+FE17 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT WHITE LENTICULAR BRACKET
+FE18 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT WHITE LENTICULAR BRAKCET
+FE19 ; Common # Po PRESENTATION FORM FOR VERTICAL HORIZONTAL ELLIPSIS
+FE30 ; Common # Po PRESENTATION FORM FOR VERTICAL TWO DOT LEADER
+FE31..FE32 ; Common # Pd [2] PRESENTATION FORM FOR VERTICAL EM DASH..PRESENTATION FORM FOR VERTICAL EN DASH
+FE33..FE34 ; Common # Pc [2] PRESENTATION FORM FOR VERTICAL LOW LINE..PRESENTATION FORM FOR VERTICAL WAVY LOW LINE
+FE35 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT PARENTHESIS
+FE36 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT PARENTHESIS
+FE37 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT CURLY BRACKET
+FE38 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT CURLY BRACKET
+FE39 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT TORTOISE SHELL BRACKET
+FE3A ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT TORTOISE SHELL BRACKET
+FE3B ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT BLACK LENTICULAR BRACKET
+FE3C ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT BLACK LENTICULAR BRACKET
+FE3D ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT DOUBLE ANGLE BRACKET
+FE3E ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT DOUBLE ANGLE BRACKET
+FE3F ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT ANGLE BRACKET
+FE40 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT ANGLE BRACKET
+FE41 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT CORNER BRACKET
+FE42 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT CORNER BRACKET
+FE43 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT WHITE CORNER BRACKET
+FE44 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT WHITE CORNER BRACKET
+FE45..FE46 ; Common # Po [2] SESAME DOT..WHITE SESAME DOT
+FE47 ; Common # Ps PRESENTATION FORM FOR VERTICAL LEFT SQUARE BRACKET
+FE48 ; Common # Pe PRESENTATION FORM FOR VERTICAL RIGHT SQUARE BRACKET
+FE49..FE4C ; Common # Po [4] DASHED OVERLINE..DOUBLE WAVY OVERLINE
+FE4D..FE4F ; Common # Pc [3] DASHED LOW LINE..WAVY LOW LINE
+FE50..FE52 ; Common # Po [3] SMALL COMMA..SMALL FULL STOP
+FE54..FE57 ; Common # Po [4] SMALL SEMICOLON..SMALL EXCLAMATION MARK
+FE58 ; Common # Pd SMALL EM DASH
+FE59 ; Common # Ps SMALL LEFT PARENTHESIS
+FE5A ; Common # Pe SMALL RIGHT PARENTHESIS
+FE5B ; Common # Ps SMALL LEFT CURLY BRACKET
+FE5C ; Common # Pe SMALL RIGHT CURLY BRACKET
+FE5D ; Common # Ps SMALL LEFT TORTOISE SHELL BRACKET
+FE5E ; Common # Pe SMALL RIGHT TORTOISE SHELL BRACKET
+FE5F..FE61 ; Common # Po [3] SMALL NUMBER SIGN..SMALL ASTERISK
+FE62 ; Common # Sm SMALL PLUS SIGN
+FE63 ; Common # Pd SMALL HYPHEN-MINUS
+FE64..FE66 ; Common # Sm [3] SMALL LESS-THAN SIGN..SMALL EQUALS SIGN
+FE68 ; Common # Po SMALL REVERSE SOLIDUS
+FE69 ; Common # Sc SMALL DOLLAR SIGN
+FE6A..FE6B ; Common # Po [2] SMALL PERCENT SIGN..SMALL COMMERCIAL AT
+FEFF ; Common # Cf ZERO WIDTH NO-BREAK SPACE
+FF01..FF03 ; Common # Po [3] FULLWIDTH EXCLAMATION MARK..FULLWIDTH NUMBER SIGN
+FF04 ; Common # Sc FULLWIDTH DOLLAR SIGN
+FF05..FF07 ; Common # Po [3] FULLWIDTH PERCENT SIGN..FULLWIDTH APOSTROPHE
+FF08 ; Common # Ps FULLWIDTH LEFT PARENTHESIS
+FF09 ; Common # Pe FULLWIDTH RIGHT PARENTHESIS
+FF0A ; Common # Po FULLWIDTH ASTERISK
+FF0B ; Common # Sm FULLWIDTH PLUS SIGN
+FF0C ; Common # Po FULLWIDTH COMMA
+FF0D ; Common # Pd FULLWIDTH HYPHEN-MINUS
+FF0E..FF0F ; Common # Po [2] FULLWIDTH FULL STOP..FULLWIDTH SOLIDUS
+FF10..FF19 ; Common # Nd [10] FULLWIDTH DIGIT ZERO..FULLWIDTH DIGIT NINE
+FF1A..FF1B ; Common # Po [2] FULLWIDTH COLON..FULLWIDTH SEMICOLON
+FF1C..FF1E ; Common # Sm [3] FULLWIDTH LESS-THAN SIGN..FULLWIDTH GREATER-THAN SIGN
+FF1F..FF20 ; Common # Po [2] FULLWIDTH QUESTION MARK..FULLWIDTH COMMERCIAL AT
+FF3B ; Common # Ps FULLWIDTH LEFT SQUARE BRACKET
+FF3C ; Common # Po FULLWIDTH REVERSE SOLIDUS
+FF3D ; Common # Pe FULLWIDTH RIGHT SQUARE BRACKET
+FF3E ; Common # Sk FULLWIDTH CIRCUMFLEX ACCENT
+FF3F ; Common # Pc FULLWIDTH LOW LINE
+FF40 ; Common # Sk FULLWIDTH GRAVE ACCENT
+FF5B ; Common # Ps FULLWIDTH LEFT CURLY BRACKET
+FF5C ; Common # Sm FULLWIDTH VERTICAL LINE
+FF5D ; Common # Pe FULLWIDTH RIGHT CURLY BRACKET
+FF5E ; Common # Sm FULLWIDTH TILDE
+FF5F ; Common # Ps FULLWIDTH LEFT WHITE PARENTHESIS
+FF60 ; Common # Pe FULLWIDTH RIGHT WHITE PARENTHESIS
+FF61 ; Common # Po HALFWIDTH IDEOGRAPHIC FULL STOP
+FF62 ; Common # Ps HALFWIDTH LEFT CORNER BRACKET
+FF63 ; Common # Pe HALFWIDTH RIGHT CORNER BRACKET
+FF64..FF65 ; Common # Po [2] HALFWIDTH IDEOGRAPHIC COMMA..HALFWIDTH KATAKANA MIDDLE DOT
+FF70 ; Common # Lm HALFWIDTH KATAKANA-HIRAGANA PROLONGED SOUND MARK
+FF9E..FF9F ; Common # Lm [2] HALFWIDTH KATAKANA VOICED SOUND MARK..HALFWIDTH KATAKANA SEMI-VOICED SOUND MARK
+FFE0..FFE1 ; Common # Sc [2] FULLWIDTH CENT SIGN..FULLWIDTH POUND SIGN
+FFE2 ; Common # Sm FULLWIDTH NOT SIGN
+FFE3 ; Common # Sk FULLWIDTH MACRON
+FFE4 ; Common # So FULLWIDTH BROKEN BAR
+FFE5..FFE6 ; Common # Sc [2] FULLWIDTH YEN SIGN..FULLWIDTH WON SIGN
+FFE8 ; Common # So HALFWIDTH FORMS LIGHT VERTICAL
+FFE9..FFEC ; Common # Sm [4] HALFWIDTH LEFTWARDS ARROW..HALFWIDTH DOWNWARDS ARROW
+FFED..FFEE ; Common # So [2] HALFWIDTH BLACK SQUARE..HALFWIDTH WHITE CIRCLE
+FFF9..FFFB ; Common # Cf [3] INTERLINEAR ANNOTATION ANCHOR..INTERLINEAR ANNOTATION TERMINATOR
+FFFC..FFFD ; Common # So [2] OBJECT REPLACEMENT CHARACTER..REPLACEMENT CHARACTER
+10100..10102 ; Common # Po [3] AEGEAN WORD SEPARATOR LINE..AEGEAN CHECK MARK
+10107..10133 ; Common # No [45] AEGEAN NUMBER ONE..AEGEAN NUMBER NINETY THOUSAND
+10137..1013F ; Common # So [9] AEGEAN WEIGHT BASE UNIT..AEGEAN MEASURE THIRD SUBUNIT
+10190..1019C ; Common # So [13] ROMAN SEXTANS SIGN..ASCIA SYMBOL
+101D0..101FC ; Common # So [45] PHAISTOS DISC SIGN PEDESTRIAN..PHAISTOS DISC SIGN WAVY BAND
+102E1..102FB ; Common # No [27] COPTIC EPACT DIGIT ONE..COPTIC EPACT NUMBER NINE HUNDRED
+1BCA0..1BCA3 ; Common # Cf [4] SHORTHAND FORMAT LETTER OVERLAP..SHORTHAND FORMAT UP STEP
+1CF50..1CFC3 ; Common # So [116] ZNAMENNY NEUME KRYUK..ZNAMENNY NEUME PAUK
+1D000..1D0F5 ; Common # So [246] BYZANTINE MUSICAL SYMBOL PSILI..BYZANTINE MUSICAL SYMBOL GORGON NEO KATO
+1D100..1D126 ; Common # So [39] MUSICAL SYMBOL SINGLE BARLINE..MUSICAL SYMBOL DRUM CLEF-2
+1D129..1D164 ; Common # So [60] MUSICAL SYMBOL MULTIPLE MEASURE REST..MUSICAL SYMBOL ONE HUNDRED TWENTY-EIGHTH NOTE
+1D165..1D166 ; Common # Mc [2] MUSICAL SYMBOL COMBINING STEM..MUSICAL SYMBOL COMBINING SPRECHGESANG STEM
+1D16A..1D16C ; Common # So [3] MUSICAL SYMBOL FINGERED TREMOLO-1..MUSICAL SYMBOL FINGERED TREMOLO-3
+1D16D..1D172 ; Common # Mc [6] MUSICAL SYMBOL COMBINING AUGMENTATION DOT..MUSICAL SYMBOL COMBINING FLAG-5
+1D173..1D17A ; Common # Cf [8] MUSICAL SYMBOL BEGIN BEAM..MUSICAL SYMBOL END PHRASE
+1D183..1D184 ; Common # So [2] MUSICAL SYMBOL ARPEGGIATO UP..MUSICAL SYMBOL ARPEGGIATO DOWN
+1D18C..1D1A9 ; Common # So [30] MUSICAL SYMBOL RINFORZANDO..MUSICAL SYMBOL DEGREE SLASH
+1D1AE..1D1EA ; Common # So [61] MUSICAL SYMBOL PEDAL MARK..MUSICAL SYMBOL KORON
+1D2C0..1D2D3 ; Common # No [20] KAKTOVIK NUMERAL ZERO..KAKTOVIK NUMERAL NINETEEN
+1D2E0..1D2F3 ; Common # No [20] MAYAN NUMERAL ZERO..MAYAN NUMERAL NINETEEN
+1D300..1D356 ; Common # So [87] MONOGRAM FOR EARTH..TETRAGRAM FOR FOSTERING
+1D360..1D378 ; Common # No [25] COUNTING ROD UNIT DIGIT ONE..TALLY MARK FIVE
+1D400..1D454 ; Common # L& [85] MATHEMATICAL BOLD CAPITAL A..MATHEMATICAL ITALIC SMALL G
+1D456..1D49C ; Common # L& [71] MATHEMATICAL ITALIC SMALL I..MATHEMATICAL SCRIPT CAPITAL A
+1D49E..1D49F ; Common # L& [2] MATHEMATICAL SCRIPT CAPITAL C..MATHEMATICAL SCRIPT CAPITAL D
+1D4A2 ; Common # L& MATHEMATICAL SCRIPT CAPITAL G
+1D4A5..1D4A6 ; Common # L& [2] MATHEMATICAL SCRIPT CAPITAL J..MATHEMATICAL SCRIPT CAPITAL K
+1D4A9..1D4AC ; Common # L& [4] MATHEMATICAL SCRIPT CAPITAL N..MATHEMATICAL SCRIPT CAPITAL Q
+1D4AE..1D4B9 ; Common # L& [12] MATHEMATICAL SCRIPT CAPITAL S..MATHEMATICAL SCRIPT SMALL D
+1D4BB ; Common # L& MATHEMATICAL SCRIPT SMALL F
+1D4BD..1D4C3 ; Common # L& [7] MATHEMATICAL SCRIPT SMALL H..MATHEMATICAL SCRIPT SMALL N
+1D4C5..1D505 ; Common # L& [65] MATHEMATICAL SCRIPT SMALL P..MATHEMATICAL FRAKTUR CAPITAL B
+1D507..1D50A ; Common # L& [4] MATHEMATICAL FRAKTUR CAPITAL D..MATHEMATICAL FRAKTUR CAPITAL G
+1D50D..1D514 ; Common # L& [8] MATHEMATICAL FRAKTUR CAPITAL J..MATHEMATICAL FRAKTUR CAPITAL Q
+1D516..1D51C ; Common # L& [7] MATHEMATICAL FRAKTUR CAPITAL S..MATHEMATICAL FRAKTUR CAPITAL Y
+1D51E..1D539 ; Common # L& [28] MATHEMATICAL FRAKTUR SMALL A..MATHEMATICAL DOUBLE-STRUCK CAPITAL B
+1D53B..1D53E ; Common # L& [4] MATHEMATICAL DOUBLE-STRUCK CAPITAL D..MATHEMATICAL DOUBLE-STRUCK CAPITAL G
+1D540..1D544 ; Common # L& [5] MATHEMATICAL DOUBLE-STRUCK CAPITAL I..MATHEMATICAL DOUBLE-STRUCK CAPITAL M
+1D546 ; Common # L& MATHEMATICAL DOUBLE-STRUCK CAPITAL O
+1D54A..1D550 ; Common # L& [7] MATHEMATICAL DOUBLE-STRUCK CAPITAL S..MATHEMATICAL DOUBLE-STRUCK CAPITAL Y
+1D552..1D6A5 ; Common # L& [340] MATHEMATICAL DOUBLE-STRUCK SMALL A..MATHEMATICAL ITALIC SMALL DOTLESS J
+1D6A8..1D6C0 ; Common # L& [25] MATHEMATICAL BOLD CAPITAL ALPHA..MATHEMATICAL BOLD CAPITAL OMEGA
+1D6C1 ; Common # Sm MATHEMATICAL BOLD NABLA
+1D6C2..1D6DA ; Common # L& [25] MATHEMATICAL BOLD SMALL ALPHA..MATHEMATICAL BOLD SMALL OMEGA
+1D6DB ; Common # Sm MATHEMATICAL BOLD PARTIAL DIFFERENTIAL
+1D6DC..1D6FA ; Common # L& [31] MATHEMATICAL BOLD EPSILON SYMBOL..MATHEMATICAL ITALIC CAPITAL OMEGA
+1D6FB ; Common # Sm MATHEMATICAL ITALIC NABLA
+1D6FC..1D714 ; Common # L& [25] MATHEMATICAL ITALIC SMALL ALPHA..MATHEMATICAL ITALIC SMALL OMEGA
+1D715 ; Common # Sm MATHEMATICAL ITALIC PARTIAL DIFFERENTIAL
+1D716..1D734 ; Common # L& [31] MATHEMATICAL ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD ITALIC CAPITAL OMEGA
+1D735 ; Common # Sm MATHEMATICAL BOLD ITALIC NABLA
+1D736..1D74E ; Common # L& [25] MATHEMATICAL BOLD ITALIC SMALL ALPHA..MATHEMATICAL BOLD ITALIC SMALL OMEGA
+1D74F ; Common # Sm MATHEMATICAL BOLD ITALIC PARTIAL DIFFERENTIAL
+1D750..1D76E ; Common # L& [31] MATHEMATICAL BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD CAPITAL OMEGA
+1D76F ; Common # Sm MATHEMATICAL SANS-SERIF BOLD NABLA
+1D770..1D788 ; Common # L& [25] MATHEMATICAL SANS-SERIF BOLD SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD SMALL OMEGA
+1D789 ; Common # Sm MATHEMATICAL SANS-SERIF BOLD PARTIAL DIFFERENTIAL
+1D78A..1D7A8 ; Common # L& [31] MATHEMATICAL SANS-SERIF BOLD EPSILON SYMBOL..MATHEMATICAL SANS-SERIF BOLD ITALIC CAPITAL OMEGA
+1D7A9 ; Common # Sm MATHEMATICAL SANS-SERIF BOLD ITALIC NABLA
+1D7AA..1D7C2 ; Common # L& [25] MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL ALPHA..MATHEMATICAL SANS-SERIF BOLD ITALIC SMALL OMEGA
+1D7C3 ; Common # Sm MATHEMATICAL SANS-SERIF BOLD ITALIC PARTIAL DIFFERENTIAL
+1D7C4..1D7CB ; Common # L& [8] MATHEMATICAL SANS-SERIF BOLD ITALIC EPSILON SYMBOL..MATHEMATICAL BOLD SMALL DIGAMMA
+1D7CE..1D7FF ; Common # Nd [50] MATHEMATICAL BOLD DIGIT ZERO..MATHEMATICAL MONOSPACE DIGIT NINE
+1EC71..1ECAB ; Common # No [59] INDIC SIYAQ NUMBER ONE..INDIC SIYAQ NUMBER PREFIXED NINE
+1ECAC ; Common # So INDIC SIYAQ PLACEHOLDER
+1ECAD..1ECAF ; Common # No [3] INDIC SIYAQ FRACTION ONE QUARTER..INDIC SIYAQ FRACTION THREE QUARTERS
+1ECB0 ; Common # Sc INDIC SIYAQ RUPEE MARK
+1ECB1..1ECB4 ; Common # No [4] INDIC SIYAQ NUMBER ALTERNATE ONE..INDIC SIYAQ ALTERNATE LAKH MARK
+1ED01..1ED2D ; Common # No [45] OTTOMAN SIYAQ NUMBER ONE..OTTOMAN SIYAQ NUMBER NINETY THOUSAND
+1ED2E ; Common # So OTTOMAN SIYAQ MARRATAN
+1ED2F..1ED3D ; Common # No [15] OTTOMAN SIYAQ ALTERNATE NUMBER TWO..OTTOMAN SIYAQ FRACTION ONE SIXTH
+1F000..1F02B ; Common # So [44] MAHJONG TILE EAST WIND..MAHJONG TILE BACK
+1F030..1F093 ; Common # So [100] DOMINO TILE HORIZONTAL BACK..DOMINO TILE VERTICAL-06-06
+1F0A0..1F0AE ; Common # So [15] PLAYING CARD BACK..PLAYING CARD KING OF SPADES
+1F0B1..1F0BF ; Common # So [15] PLAYING CARD ACE OF HEARTS..PLAYING CARD RED JOKER
+1F0C1..1F0CF ; Common # So [15] PLAYING CARD ACE OF DIAMONDS..PLAYING CARD BLACK JOKER
+1F0D1..1F0F5 ; Common # So [37] PLAYING CARD ACE OF CLUBS..PLAYING CARD TRUMP-21
+1F100..1F10C ; Common # No [13] DIGIT ZERO FULL STOP..DINGBAT NEGATIVE CIRCLED SANS-SERIF DIGIT ZERO
+1F10D..1F1AD ; Common # So [161] CIRCLED ZERO WITH SLASH..MASK WORK SYMBOL
+1F1E6..1F1FF ; Common # So [26] REGIONAL INDICATOR SYMBOL LETTER A..REGIONAL INDICATOR SYMBOL LETTER Z
+1F201..1F202 ; Common # So [2] SQUARED KATAKANA KOKO..SQUARED KATAKANA SA
+1F210..1F23B ; Common # So [44] SQUARED CJK UNIFIED IDEOGRAPH-624B..SQUARED CJK UNIFIED IDEOGRAPH-914D
+1F240..1F248 ; Common # So [9] TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-672C..TORTOISE SHELL BRACKETED CJK UNIFIED IDEOGRAPH-6557
+1F250..1F251 ; Common # So [2] CIRCLED IDEOGRAPH ADVANTAGE..CIRCLED IDEOGRAPH ACCEPT
+1F260..1F265 ; Common # So [6] ROUNDED SYMBOL FOR FU..ROUNDED SYMBOL FOR CAI
+1F300..1F3FA ; Common # So [251] CYCLONE..AMPHORA
+1F3FB..1F3FF ; Common # Sk [5] EMOJI MODIFIER FITZPATRICK TYPE-1-2..EMOJI MODIFIER FITZPATRICK TYPE-6
+1F400..1F6D7 ; Common # So [728] RAT..ELEVATOR
+1F6DC..1F6EC ; Common # So [17] WIRELESS..AIRPLANE ARRIVING
+1F6F0..1F6FC ; Common # So [13] SATELLITE..ROLLER SKATE
+1F700..1F776 ; Common # So [119] ALCHEMICAL SYMBOL FOR QUINTESSENCE..LUNAR ECLIPSE
+1F77B..1F7D9 ; Common # So [95] HAUMEA..NINE POINTED WHITE STAR
+1F7E0..1F7EB ; Common # So [12] LARGE ORANGE CIRCLE..LARGE BROWN SQUARE
+1F7F0 ; Common # So HEAVY EQUALS SIGN
+1F800..1F80B ; Common # So [12] LEFTWARDS ARROW WITH SMALL TRIANGLE ARROWHEAD..DOWNWARDS ARROW WITH LARGE TRIANGLE ARROWHEAD
+1F810..1F847 ; Common # So [56] LEFTWARDS ARROW WITH SMALL EQUILATERAL ARROWHEAD..DOWNWARDS HEAVY ARROW
+1F850..1F859 ; Common # So [10] LEFTWARDS SANS-SERIF ARROW..UP DOWN SANS-SERIF ARROW
+1F860..1F887 ; Common # So [40] WIDE-HEADED LEFTWARDS LIGHT BARB ARROW..WIDE-HEADED SOUTH WEST VERY HEAVY BARB ARROW
+1F890..1F8AD ; Common # So [30] LEFTWARDS TRIANGLE ARROWHEAD..WHITE ARROW SHAFT WIDTH TWO THIRDS
+1F8B0..1F8B1 ; Common # So [2] ARROW POINTING UPWARDS THEN NORTH WEST..ARROW POINTING RIGHTWARDS THEN CURVING SOUTH WEST
+1F900..1FA53 ; Common # So [340] CIRCLED CROSS FORMEE WITH FOUR DOTS..BLACK CHESS KNIGHT-BISHOP
+1FA60..1FA6D ; Common # So [14] XIANGQI RED GENERAL..XIANGQI BLACK SOLDIER
+1FA70..1FA7C ; Common # So [13] BALLET SHOES..CRUTCH
+1FA80..1FA88 ; Common # So [9] YO-YO..FLUTE
+1FA90..1FABD ; Common # So [46] RINGED PLANET..WING
+1FABF..1FAC5 ; Common # So [7] GOOSE..PERSON WITH CROWN
+1FACE..1FADB ; Common # So [14] MOOSE..PEA POD
+1FAE0..1FAE8 ; Common # So [9] MELTING FACE..SHAKING FACE
+1FAF0..1FAF8 ; Common # So [9] HAND WITH INDEX FINGER AND THUMB CROSSED..RIGHTWARDS PUSHING HAND
+1FB00..1FB92 ; Common # So [147] BLOCK SEXTANT-1..UPPER HALF INVERSE MEDIUM SHADE AND LOWER HALF BLOCK
+1FB94..1FBCA ; Common # So [55] LEFT HALF INVERSE MEDIUM SHADE AND RIGHT HALF BLOCK..WHITE UP-POINTING CHEVRON
+1FBF0..1FBF9 ; Common # Nd [10] SEGMENTED DIGIT ZERO..SEGMENTED DIGIT NINE
+E0001 ; Common # Cf LANGUAGE TAG
+E0020..E007F ; Common # Cf [96] TAG SPACE..CANCEL TAG
+
+# Total code points: 8306
+
+# ================================================
+
+0041..005A ; Latin # L& [26] LATIN CAPITAL LETTER A..LATIN CAPITAL LETTER Z
+0061..007A ; Latin # L& [26] LATIN SMALL LETTER A..LATIN SMALL LETTER Z
+00AA ; Latin # Lo FEMININE ORDINAL INDICATOR
+00BA ; Latin # Lo MASCULINE ORDINAL INDICATOR
+00C0..00D6 ; Latin # L& [23] LATIN CAPITAL LETTER A WITH GRAVE..LATIN CAPITAL LETTER O WITH DIAERESIS
+00D8..00F6 ; Latin # L& [31] LATIN CAPITAL LETTER O WITH STROKE..LATIN SMALL LETTER O WITH DIAERESIS
+00F8..01BA ; Latin # L& [195] LATIN SMALL LETTER O WITH STROKE..LATIN SMALL LETTER EZH WITH TAIL
+01BB ; Latin # Lo LATIN LETTER TWO WITH STROKE
+01BC..01BF ; Latin # L& [4] LATIN CAPITAL LETTER TONE FIVE..LATIN LETTER WYNN
+01C0..01C3 ; Latin # Lo [4] LATIN LETTER DENTAL CLICK..LATIN LETTER RETROFLEX CLICK
+01C4..0293 ; Latin # L& [208] LATIN CAPITAL LETTER DZ WITH CARON..LATIN SMALL LETTER EZH WITH CURL
+0294 ; Latin # Lo LATIN LETTER GLOTTAL STOP
+0295..02AF ; Latin # L& [27] LATIN LETTER PHARYNGEAL VOICED FRICATIVE..LATIN SMALL LETTER TURNED H WITH FISHHOOK AND TAIL
+02B0..02B8 ; Latin # Lm [9] MODIFIER LETTER SMALL H..MODIFIER LETTER SMALL Y
+02E0..02E4 ; Latin # Lm [5] MODIFIER LETTER SMALL GAMMA..MODIFIER LETTER SMALL REVERSED GLOTTAL STOP
+1D00..1D25 ; Latin # L& [38] LATIN LETTER SMALL CAPITAL A..LATIN LETTER AIN
+1D2C..1D5C ; Latin # Lm [49] MODIFIER LETTER CAPITAL A..MODIFIER LETTER SMALL AIN
+1D62..1D65 ; Latin # Lm [4] LATIN SUBSCRIPT SMALL LETTER I..LATIN SUBSCRIPT SMALL LETTER V
+1D6B..1D77 ; Latin # L& [13] LATIN SMALL LETTER UE..LATIN SMALL LETTER TURNED G
+1D79..1D9A ; Latin # L& [34] LATIN SMALL LETTER INSULAR G..LATIN SMALL LETTER EZH WITH RETROFLEX HOOK
+1D9B..1DBE ; Latin # Lm [36] MODIFIER LETTER SMALL TURNED ALPHA..MODIFIER LETTER SMALL EZH
+1E00..1EFF ; Latin # L& [256] LATIN CAPITAL LETTER A WITH RING BELOW..LATIN SMALL LETTER Y WITH LOOP
+2071 ; Latin # Lm SUPERSCRIPT LATIN SMALL LETTER I
+207F ; Latin # Lm SUPERSCRIPT LATIN SMALL LETTER N
+2090..209C ; Latin # Lm [13] LATIN SUBSCRIPT SMALL LETTER A..LATIN SUBSCRIPT SMALL LETTER T
+212A..212B ; Latin # L& [2] KELVIN SIGN..ANGSTROM SIGN
+2132 ; Latin # L& TURNED CAPITAL F
+214E ; Latin # L& TURNED SMALL F
+2160..2182 ; Latin # Nl [35] ROMAN NUMERAL ONE..ROMAN NUMERAL TEN THOUSAND
+2183..2184 ; Latin # L& [2] ROMAN NUMERAL REVERSED ONE HUNDRED..LATIN SMALL LETTER REVERSED C
+2185..2188 ; Latin # Nl [4] ROMAN NUMERAL SIX LATE FORM..ROMAN NUMERAL ONE HUNDRED THOUSAND
+2C60..2C7B ; Latin # L& [28] LATIN CAPITAL LETTER L WITH DOUBLE BAR..LATIN LETTER SMALL CAPITAL TURNED E
+2C7C..2C7D ; Latin # Lm [2] LATIN SUBSCRIPT SMALL LETTER J..MODIFIER LETTER CAPITAL V
+2C7E..2C7F ; Latin # L& [2] LATIN CAPITAL LETTER S WITH SWASH TAIL..LATIN CAPITAL LETTER Z WITH SWASH TAIL
+A722..A76F ; Latin # L& [78] LATIN CAPITAL LETTER EGYPTOLOGICAL ALEF..LATIN SMALL LETTER CON
+A770 ; Latin # Lm MODIFIER LETTER US
+A771..A787 ; Latin # L& [23] LATIN SMALL LETTER DUM..LATIN SMALL LETTER INSULAR T
+A78B..A78E ; Latin # L& [4] LATIN CAPITAL LETTER SALTILLO..LATIN SMALL LETTER L WITH RETROFLEX HOOK AND BELT
+A78F ; Latin # Lo LATIN LETTER SINOLOGICAL DOT
+A790..A7CA ; Latin # L& [59] LATIN CAPITAL LETTER N WITH DESCENDER..LATIN SMALL LETTER S WITH SHORT STROKE OVERLAY
+A7D0..A7D1 ; Latin # L& [2] LATIN CAPITAL LETTER CLOSED INSULAR G..LATIN SMALL LETTER CLOSED INSULAR G
+A7D3 ; Latin # L& LATIN SMALL LETTER DOUBLE THORN
+A7D5..A7D9 ; Latin # L& [5] LATIN SMALL LETTER DOUBLE WYNN..LATIN SMALL LETTER SIGMOID S
+A7F2..A7F4 ; Latin # Lm [3] MODIFIER LETTER CAPITAL C..MODIFIER LETTER CAPITAL Q
+A7F5..A7F6 ; Latin # L& [2] LATIN CAPITAL LETTER REVERSED HALF H..LATIN SMALL LETTER REVERSED HALF H
+A7F7 ; Latin # Lo LATIN EPIGRAPHIC LETTER SIDEWAYS I
+A7F8..A7F9 ; Latin # Lm [2] MODIFIER LETTER CAPITAL H WITH STROKE..MODIFIER LETTER SMALL LIGATURE OE
+A7FA ; Latin # L& LATIN LETTER SMALL CAPITAL TURNED M
+A7FB..A7FF ; Latin # Lo [5] LATIN EPIGRAPHIC LETTER REVERSED F..LATIN EPIGRAPHIC LETTER ARCHAIC M
+AB30..AB5A ; Latin # L& [43] LATIN SMALL LETTER BARRED ALPHA..LATIN SMALL LETTER Y WITH SHORT RIGHT LEG
+AB5C..AB5F ; Latin # Lm [4] MODIFIER LETTER SMALL HENG..MODIFIER LETTER SMALL U WITH LEFT HOOK
+AB60..AB64 ; Latin # L& [5] LATIN SMALL LETTER SAKHA YAT..LATIN SMALL LETTER INVERTED ALPHA
+AB66..AB68 ; Latin # L& [3] LATIN SMALL LETTER DZ DIGRAPH WITH RETROFLEX HOOK..LATIN SMALL LETTER TURNED R WITH MIDDLE TILDE
+AB69 ; Latin # Lm MODIFIER LETTER SMALL TURNED W
+FB00..FB06 ; Latin # L& [7] LATIN SMALL LIGATURE FF..LATIN SMALL LIGATURE ST
+FF21..FF3A ; Latin # L& [26] FULLWIDTH LATIN CAPITAL LETTER A..FULLWIDTH LATIN CAPITAL LETTER Z
+FF41..FF5A ; Latin # L& [26] FULLWIDTH LATIN SMALL LETTER A..FULLWIDTH LATIN SMALL LETTER Z
+10780..10785 ; Latin # Lm [6] MODIFIER LETTER SMALL CAPITAL AA..MODIFIER LETTER SMALL B WITH HOOK
+10787..107B0 ; Latin # Lm [42] MODIFIER LETTER SMALL DZ DIGRAPH..MODIFIER LETTER SMALL V WITH RIGHT HOOK
+107B2..107BA ; Latin # Lm [9] MODIFIER LETTER SMALL CAPITAL Y..MODIFIER LETTER SMALL S WITH CURL
+1DF00..1DF09 ; Latin # L& [10] LATIN SMALL LETTER FENG DIGRAPH WITH TRILL..LATIN SMALL LETTER T WITH HOOK AND RETROFLEX HOOK
+1DF0A ; Latin # Lo LATIN LETTER RETROFLEX CLICK WITH RETROFLEX HOOK
+1DF0B..1DF1E ; Latin # L& [20] LATIN SMALL LETTER ESH WITH DOUBLE BAR..LATIN SMALL LETTER S WITH CURL
+1DF25..1DF2A ; Latin # L& [6] LATIN SMALL LETTER D WITH MID-HEIGHT LEFT HOOK..LATIN SMALL LETTER T WITH MID-HEIGHT LEFT HOOK
+
+# Total code points: 1481
+
+# ================================================
+
+0370..0373 ; Greek # L& [4] GREEK CAPITAL LETTER HETA..GREEK SMALL LETTER ARCHAIC SAMPI
+0375 ; Greek # Sk GREEK LOWER NUMERAL SIGN
+0376..0377 ; Greek # L& [2] GREEK CAPITAL LETTER PAMPHYLIAN DIGAMMA..GREEK SMALL LETTER PAMPHYLIAN DIGAMMA
+037A ; Greek # Lm GREEK YPOGEGRAMMENI
+037B..037D ; Greek # L& [3] GREEK SMALL REVERSED LUNATE SIGMA SYMBOL..GREEK SMALL REVERSED DOTTED LUNATE SIGMA SYMBOL
+037F ; Greek # L& GREEK CAPITAL LETTER YOT
+0384 ; Greek # Sk GREEK TONOS
+0386 ; Greek # L& GREEK CAPITAL LETTER ALPHA WITH TONOS
+0388..038A ; Greek # L& [3] GREEK CAPITAL LETTER EPSILON WITH TONOS..GREEK CAPITAL LETTER IOTA WITH TONOS
+038C ; Greek # L& GREEK CAPITAL LETTER OMICRON WITH TONOS
+038E..03A1 ; Greek # L& [20] GREEK CAPITAL LETTER UPSILON WITH TONOS..GREEK CAPITAL LETTER RHO
+03A3..03E1 ; Greek # L& [63] GREEK CAPITAL LETTER SIGMA..GREEK SMALL LETTER SAMPI
+03F0..03F5 ; Greek # L& [6] GREEK KAPPA SYMBOL..GREEK LUNATE EPSILON SYMBOL
+03F6 ; Greek # Sm GREEK REVERSED LUNATE EPSILON SYMBOL
+03F7..03FF ; Greek # L& [9] GREEK CAPITAL LETTER SHO..GREEK CAPITAL REVERSED DOTTED LUNATE SIGMA SYMBOL
+1D26..1D2A ; Greek # L& [5] GREEK LETTER SMALL CAPITAL GAMMA..GREEK LETTER SMALL CAPITAL PSI
+1D5D..1D61 ; Greek # Lm [5] MODIFIER LETTER SMALL BETA..MODIFIER LETTER SMALL CHI
+1D66..1D6A ; Greek # Lm [5] GREEK SUBSCRIPT SMALL LETTER BETA..GREEK SUBSCRIPT SMALL LETTER CHI
+1DBF ; Greek # Lm MODIFIER LETTER SMALL THETA
+1F00..1F15 ; Greek # L& [22] GREEK SMALL LETTER ALPHA WITH PSILI..GREEK SMALL LETTER EPSILON WITH DASIA AND OXIA
+1F18..1F1D ; Greek # L& [6] GREEK CAPITAL LETTER EPSILON WITH PSILI..GREEK CAPITAL LETTER EPSILON WITH DASIA AND OXIA
+1F20..1F45 ; Greek # L& [38] GREEK SMALL LETTER ETA WITH PSILI..GREEK SMALL LETTER OMICRON WITH DASIA AND OXIA
+1F48..1F4D ; Greek # L& [6] GREEK CAPITAL LETTER OMICRON WITH PSILI..GREEK CAPITAL LETTER OMICRON WITH DASIA AND OXIA
+1F50..1F57 ; Greek # L& [8] GREEK SMALL LETTER UPSILON WITH PSILI..GREEK SMALL LETTER UPSILON WITH DASIA AND PERISPOMENI
+1F59 ; Greek # L& GREEK CAPITAL LETTER UPSILON WITH DASIA
+1F5B ; Greek # L& GREEK CAPITAL LETTER UPSILON WITH DASIA AND VARIA
+1F5D ; Greek # L& GREEK CAPITAL LETTER UPSILON WITH DASIA AND OXIA
+1F5F..1F7D ; Greek # L& [31] GREEK CAPITAL LETTER UPSILON WITH DASIA AND PERISPOMENI..GREEK SMALL LETTER OMEGA WITH OXIA
+1F80..1FB4 ; Greek # L& [53] GREEK SMALL LETTER ALPHA WITH PSILI AND YPOGEGRAMMENI..GREEK SMALL LETTER ALPHA WITH OXIA AND YPOGEGRAMMENI
+1FB6..1FBC ; Greek # L& [7] GREEK SMALL LETTER ALPHA WITH PERISPOMENI..GREEK CAPITAL LETTER ALPHA WITH PROSGEGRAMMENI
+1FBD ; Greek # Sk GREEK KORONIS
+1FBE ; Greek # L& GREEK PROSGEGRAMMENI
+1FBF..1FC1 ; Greek # Sk [3] GREEK PSILI..GREEK DIALYTIKA AND PERISPOMENI
+1FC2..1FC4 ; Greek # L& [3] GREEK SMALL LETTER ETA WITH VARIA AND YPOGEGRAMMENI..GREEK SMALL LETTER ETA WITH OXIA AND YPOGEGRAMMENI
+1FC6..1FCC ; Greek # L& [7] GREEK SMALL LETTER ETA WITH PERISPOMENI..GREEK CAPITAL LETTER ETA WITH PROSGEGRAMMENI
+1FCD..1FCF ; Greek # Sk [3] GREEK PSILI AND VARIA..GREEK PSILI AND PERISPOMENI
+1FD0..1FD3 ; Greek # L& [4] GREEK SMALL LETTER IOTA WITH VRACHY..GREEK SMALL LETTER IOTA WITH DIALYTIKA AND OXIA
+1FD6..1FDB ; Greek # L& [6] GREEK SMALL LETTER IOTA WITH PERISPOMENI..GREEK CAPITAL LETTER IOTA WITH OXIA
+1FDD..1FDF ; Greek # Sk [3] GREEK DASIA AND VARIA..GREEK DASIA AND PERISPOMENI
+1FE0..1FEC ; Greek # L& [13] GREEK SMALL LETTER UPSILON WITH VRACHY..GREEK CAPITAL LETTER RHO WITH DASIA
+1FED..1FEF ; Greek # Sk [3] GREEK DIALYTIKA AND VARIA..GREEK VARIA
+1FF2..1FF4 ; Greek # L& [3] GREEK SMALL LETTER OMEGA WITH VARIA AND YPOGEGRAMMENI..GREEK SMALL LETTER OMEGA WITH OXIA AND YPOGEGRAMMENI
+1FF6..1FFC ; Greek # L& [7] GREEK SMALL LETTER OMEGA WITH PERISPOMENI..GREEK CAPITAL LETTER OMEGA WITH PROSGEGRAMMENI
+1FFD..1FFE ; Greek # Sk [2] GREEK OXIA..GREEK DASIA
+2126 ; Greek # L& OHM SIGN
+AB65 ; Greek # L& GREEK LETTER SMALL CAPITAL OMEGA
+10140..10174 ; Greek # Nl [53] GREEK ACROPHONIC ATTIC ONE QUARTER..GREEK ACROPHONIC STRATIAN FIFTY MNAS
+10175..10178 ; Greek # No [4] GREEK ONE HALF SIGN..GREEK THREE QUARTERS SIGN
+10179..10189 ; Greek # So [17] GREEK YEAR SIGN..GREEK TRYBLION BASE SIGN
+1018A..1018B ; Greek # No [2] GREEK ZERO SIGN..GREEK ONE QUARTER SIGN
+1018C..1018E ; Greek # So [3] GREEK SINUSOID SIGN..NOMISMA SIGN
+101A0 ; Greek # So GREEK SYMBOL TAU RHO
+1D200..1D241 ; Greek # So [66] GREEK VOCAL NOTATION SYMBOL-1..GREEK INSTRUMENTAL NOTATION SYMBOL-54
+1D242..1D244 ; Greek # Mn [3] COMBINING GREEK MUSICAL TRISEME..COMBINING GREEK MUSICAL PENTASEME
+1D245 ; Greek # So GREEK MUSICAL LEIMMA
+
+# Total code points: 518
+
+# ================================================
+
+0400..0481 ; Cyrillic # L& [130] CYRILLIC CAPITAL LETTER IE WITH GRAVE..CYRILLIC SMALL LETTER KOPPA
+0482 ; Cyrillic # So CYRILLIC THOUSANDS SIGN
+0483..0484 ; Cyrillic # Mn [2] COMBINING CYRILLIC TITLO..COMBINING CYRILLIC PALATALIZATION
+0487 ; Cyrillic # Mn COMBINING CYRILLIC POKRYTIE
+0488..0489 ; Cyrillic # Me [2] COMBINING CYRILLIC HUNDRED THOUSANDS SIGN..COMBINING CYRILLIC MILLIONS SIGN
+048A..052F ; Cyrillic # L& [166] CYRILLIC CAPITAL LETTER SHORT I WITH TAIL..CYRILLIC SMALL LETTER EL WITH DESCENDER
+1C80..1C88 ; Cyrillic # L& [9] CYRILLIC SMALL LETTER ROUNDED VE..CYRILLIC SMALL LETTER UNBLENDED UK
+1D2B ; Cyrillic # L& CYRILLIC LETTER SMALL CAPITAL EL
+1D78 ; Cyrillic # Lm MODIFIER LETTER CYRILLIC EN
+2DE0..2DFF ; Cyrillic # Mn [32] COMBINING CYRILLIC LETTER BE..COMBINING CYRILLIC LETTER IOTIFIED BIG YUS
+A640..A66D ; Cyrillic # L& [46] CYRILLIC CAPITAL LETTER ZEMLYA..CYRILLIC SMALL LETTER DOUBLE MONOCULAR O
+A66E ; Cyrillic # Lo CYRILLIC LETTER MULTIOCULAR O
+A66F ; Cyrillic # Mn COMBINING CYRILLIC VZMET
+A670..A672 ; Cyrillic # Me [3] COMBINING CYRILLIC TEN MILLIONS SIGN..COMBINING CYRILLIC THOUSAND MILLIONS SIGN
+A673 ; Cyrillic # Po SLAVONIC ASTERISK
+A674..A67D ; Cyrillic # Mn [10] COMBINING CYRILLIC LETTER UKRAINIAN IE..COMBINING CYRILLIC PAYEROK
+A67E ; Cyrillic # Po CYRILLIC KAVYKA
+A67F ; Cyrillic # Lm CYRILLIC PAYEROK
+A680..A69B ; Cyrillic # L& [28] CYRILLIC CAPITAL LETTER DWE..CYRILLIC SMALL LETTER CROSSED O
+A69C..A69D ; Cyrillic # Lm [2] MODIFIER LETTER CYRILLIC HARD SIGN..MODIFIER LETTER CYRILLIC SOFT SIGN
+A69E..A69F ; Cyrillic # Mn [2] COMBINING CYRILLIC LETTER EF..COMBINING CYRILLIC LETTER IOTIFIED E
+FE2E..FE2F ; Cyrillic # Mn [2] COMBINING CYRILLIC TITLO LEFT HALF..COMBINING CYRILLIC TITLO RIGHT HALF
+1E030..1E06D ; Cyrillic # Lm [62] MODIFIER LETTER CYRILLIC SMALL A..MODIFIER LETTER CYRILLIC SMALL STRAIGHT U WITH STROKE
+1E08F ; Cyrillic # Mn COMBINING CYRILLIC SMALL LETTER BYELORUSSIAN-UKRAINIAN I
+
+# Total code points: 506
+
+# ================================================
+
+0531..0556 ; Armenian # L& [38] ARMENIAN CAPITAL LETTER AYB..ARMENIAN CAPITAL LETTER FEH
+0559 ; Armenian # Lm ARMENIAN MODIFIER LETTER LEFT HALF RING
+055A..055F ; Armenian # Po [6] ARMENIAN APOSTROPHE..ARMENIAN ABBREVIATION MARK
+0560..0588 ; Armenian # L& [41] ARMENIAN SMALL LETTER TURNED AYB..ARMENIAN SMALL LETTER YI WITH STROKE
+0589 ; Armenian # Po ARMENIAN FULL STOP
+058A ; Armenian # Pd ARMENIAN HYPHEN
+058D..058E ; Armenian # So [2] RIGHT-FACING ARMENIAN ETERNITY SIGN..LEFT-FACING ARMENIAN ETERNITY SIGN
+058F ; Armenian # Sc ARMENIAN DRAM SIGN
+FB13..FB17 ; Armenian # L& [5] ARMENIAN SMALL LIGATURE MEN NOW..ARMENIAN SMALL LIGATURE MEN XEH
+
+# Total code points: 96
+
+# ================================================
+
+0591..05BD ; Hebrew # Mn [45] HEBREW ACCENT ETNAHTA..HEBREW POINT METEG
+05BE ; Hebrew # Pd HEBREW PUNCTUATION MAQAF
+05BF ; Hebrew # Mn HEBREW POINT RAFE
+05C0 ; Hebrew # Po HEBREW PUNCTUATION PASEQ
+05C1..05C2 ; Hebrew # Mn [2] HEBREW POINT SHIN DOT..HEBREW POINT SIN DOT
+05C3 ; Hebrew # Po HEBREW PUNCTUATION SOF PASUQ
+05C4..05C5 ; Hebrew # Mn [2] HEBREW MARK UPPER DOT..HEBREW MARK LOWER DOT
+05C6 ; Hebrew # Po HEBREW PUNCTUATION NUN HAFUKHA
+05C7 ; Hebrew # Mn HEBREW POINT QAMATS QATAN
+05D0..05EA ; Hebrew # Lo [27] HEBREW LETTER ALEF..HEBREW LETTER TAV
+05EF..05F2 ; Hebrew # Lo [4] HEBREW YOD TRIANGLE..HEBREW LIGATURE YIDDISH DOUBLE YOD
+05F3..05F4 ; Hebrew # Po [2] HEBREW PUNCTUATION GERESH..HEBREW PUNCTUATION GERSHAYIM
+FB1D ; Hebrew # Lo HEBREW LETTER YOD WITH HIRIQ
+FB1E ; Hebrew # Mn HEBREW POINT JUDEO-SPANISH VARIKA
+FB1F..FB28 ; Hebrew # Lo [10] HEBREW LIGATURE YIDDISH YOD YOD PATAH..HEBREW LETTER WIDE TAV
+FB29 ; Hebrew # Sm HEBREW LETTER ALTERNATIVE PLUS SIGN
+FB2A..FB36 ; Hebrew # Lo [13] HEBREW LETTER SHIN WITH SHIN DOT..HEBREW LETTER ZAYIN WITH DAGESH
+FB38..FB3C ; Hebrew # Lo [5] HEBREW LETTER TET WITH DAGESH..HEBREW LETTER LAMED WITH DAGESH
+FB3E ; Hebrew # Lo HEBREW LETTER MEM WITH DAGESH
+FB40..FB41 ; Hebrew # Lo [2] HEBREW LETTER NUN WITH DAGESH..HEBREW LETTER SAMEKH WITH DAGESH
+FB43..FB44 ; Hebrew # Lo [2] HEBREW LETTER FINAL PE WITH DAGESH..HEBREW LETTER PE WITH DAGESH
+FB46..FB4F ; Hebrew # Lo [10] HEBREW LETTER TSADI WITH DAGESH..HEBREW LIGATURE ALEF LAMED
+
+# Total code points: 134
+
+# ================================================
+
+0600..0604 ; Arabic # Cf [5] ARABIC NUMBER SIGN..ARABIC SIGN SAMVAT
+0606..0608 ; Arabic # Sm [3] ARABIC-INDIC CUBE ROOT..ARABIC RAY
+0609..060A ; Arabic # Po [2] ARABIC-INDIC PER MILLE SIGN..ARABIC-INDIC PER TEN THOUSAND SIGN
+060B ; Arabic # Sc AFGHANI SIGN
+060D ; Arabic # Po ARABIC DATE SEPARATOR
+060E..060F ; Arabic # So [2] ARABIC POETIC VERSE SIGN..ARABIC SIGN MISRA
+0610..061A ; Arabic # Mn [11] ARABIC SIGN SALLALLAHOU ALAYHE WASSALLAM..ARABIC SMALL KASRA
+061C ; Arabic # Cf ARABIC LETTER MARK
+061D..061E ; Arabic # Po [2] ARABIC END OF TEXT MARK..ARABIC TRIPLE DOT PUNCTUATION MARK
+0620..063F ; Arabic # Lo [32] ARABIC LETTER KASHMIRI YEH..ARABIC LETTER FARSI YEH WITH THREE DOTS ABOVE
+0641..064A ; Arabic # Lo [10] ARABIC LETTER FEH..ARABIC LETTER YEH
+0656..065F ; Arabic # Mn [10] ARABIC SUBSCRIPT ALEF..ARABIC WAVY HAMZA BELOW
+0660..0669 ; Arabic # Nd [10] ARABIC-INDIC DIGIT ZERO..ARABIC-INDIC DIGIT NINE
+066A..066D ; Arabic # Po [4] ARABIC PERCENT SIGN..ARABIC FIVE POINTED STAR
+066E..066F ; Arabic # Lo [2] ARABIC LETTER DOTLESS BEH..ARABIC LETTER DOTLESS QAF
+0671..06D3 ; Arabic # Lo [99] ARABIC LETTER ALEF WASLA..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE
+06D4 ; Arabic # Po ARABIC FULL STOP
+06D5 ; Arabic # Lo ARABIC LETTER AE
+06D6..06DC ; Arabic # Mn [7] ARABIC SMALL HIGH LIGATURE SAD WITH LAM WITH ALEF MAKSURA..ARABIC SMALL HIGH SEEN
+06DE ; Arabic # So ARABIC START OF RUB EL HIZB
+06DF..06E4 ; Arabic # Mn [6] ARABIC SMALL HIGH ROUNDED ZERO..ARABIC SMALL HIGH MADDA
+06E5..06E6 ; Arabic # Lm [2] ARABIC SMALL WAW..ARABIC SMALL YEH
+06E7..06E8 ; Arabic # Mn [2] ARABIC SMALL HIGH YEH..ARABIC SMALL HIGH NOON
+06E9 ; Arabic # So ARABIC PLACE OF SAJDAH
+06EA..06ED ; Arabic # Mn [4] ARABIC EMPTY CENTRE LOW STOP..ARABIC SMALL LOW MEEM
+06EE..06EF ; Arabic # Lo [2] ARABIC LETTER DAL WITH INVERTED V..ARABIC LETTER REH WITH INVERTED V
+06F0..06F9 ; Arabic # Nd [10] EXTENDED ARABIC-INDIC DIGIT ZERO..EXTENDED ARABIC-INDIC DIGIT NINE
+06FA..06FC ; Arabic # Lo [3] ARABIC LETTER SHEEN WITH DOT BELOW..ARABIC LETTER GHAIN WITH DOT BELOW
+06FD..06FE ; Arabic # So [2] ARABIC SIGN SINDHI AMPERSAND..ARABIC SIGN SINDHI POSTPOSITION MEN
+06FF ; Arabic # Lo ARABIC LETTER HEH WITH INVERTED V
+0750..077F ; Arabic # Lo [48] ARABIC LETTER BEH WITH THREE DOTS HORIZONTALLY BELOW..ARABIC LETTER KAF WITH TWO DOTS ABOVE
+0870..0887 ; Arabic # Lo [24] ARABIC LETTER ALEF WITH ATTACHED FATHA..ARABIC BASELINE ROUND DOT
+0888 ; Arabic # Sk ARABIC RAISED ROUND DOT
+0889..088E ; Arabic # Lo [6] ARABIC LETTER NOON WITH INVERTED SMALL V..ARABIC VERTICAL TAIL
+0890..0891 ; Arabic # Cf [2] ARABIC POUND MARK ABOVE..ARABIC PIASTRE MARK ABOVE
+0898..089F ; Arabic # Mn [8] ARABIC SMALL HIGH WORD AL-JUZ..ARABIC HALF MADDA OVER MADDA
+08A0..08C8 ; Arabic # Lo [41] ARABIC LETTER BEH WITH SMALL V BELOW..ARABIC LETTER GRAF
+08C9 ; Arabic # Lm ARABIC SMALL FARSI YEH
+08CA..08E1 ; Arabic # Mn [24] ARABIC SMALL HIGH FARSI YEH..ARABIC SMALL HIGH SIGN SAFHA
+08E3..08FF ; Arabic # Mn [29] ARABIC TURNED DAMMA BELOW..ARABIC MARK SIDEWAYS NOON GHUNNA
+FB50..FBB1 ; Arabic # Lo [98] ARABIC LETTER ALEF WASLA ISOLATED FORM..ARABIC LETTER YEH BARREE WITH HAMZA ABOVE FINAL FORM
+FBB2..FBC2 ; Arabic # Sk [17] ARABIC SYMBOL DOT ABOVE..ARABIC SYMBOL WASLA ABOVE
+FBD3..FD3D ; Arabic # Lo [363] ARABIC LETTER NG ISOLATED FORM..ARABIC LIGATURE ALEF WITH FATHATAN ISOLATED FORM
+FD40..FD4F ; Arabic # So [16] ARABIC LIGATURE RAHIMAHU ALLAAH..ARABIC LIGATURE RAHIMAHUM ALLAAH
+FD50..FD8F ; Arabic # Lo [64] ARABIC LIGATURE TEH WITH JEEM WITH MEEM INITIAL FORM..ARABIC LIGATURE MEEM WITH KHAH WITH MEEM INITIAL FORM
+FD92..FDC7 ; Arabic # Lo [54] ARABIC LIGATURE MEEM WITH JEEM WITH KHAH INITIAL FORM..ARABIC LIGATURE NOON WITH JEEM WITH YEH FINAL FORM
+FDCF ; Arabic # So ARABIC LIGATURE SALAAMUHU ALAYNAA
+FDF0..FDFB ; Arabic # Lo [12] ARABIC LIGATURE SALLA USED AS KORANIC STOP SIGN ISOLATED FORM..ARABIC LIGATURE JALLAJALALOUHOU
+FDFC ; Arabic # Sc RIAL SIGN
+FDFD..FDFF ; Arabic # So [3] ARABIC LIGATURE BISMILLAH AR-RAHMAN AR-RAHEEM..ARABIC LIGATURE AZZA WA JALL
+FE70..FE74 ; Arabic # Lo [5] ARABIC FATHATAN ISOLATED FORM..ARABIC KASRATAN ISOLATED FORM
+FE76..FEFC ; Arabic # Lo [135] ARABIC FATHA ISOLATED FORM..ARABIC LIGATURE LAM WITH ALEF FINAL FORM
+10E60..10E7E ; Arabic # No [31] RUMI DIGIT ONE..RUMI FRACTION TWO THIRDS
+10EFD..10EFF ; Arabic # Mn [3] ARABIC SMALL LOW WORD SAKTA..ARABIC SMALL LOW WORD MADDA
+1EE00..1EE03 ; Arabic # Lo [4] ARABIC MATHEMATICAL ALEF..ARABIC MATHEMATICAL DAL
+1EE05..1EE1F ; Arabic # Lo [27] ARABIC MATHEMATICAL WAW..ARABIC MATHEMATICAL DOTLESS QAF
+1EE21..1EE22 ; Arabic # Lo [2] ARABIC MATHEMATICAL INITIAL BEH..ARABIC MATHEMATICAL INITIAL JEEM
+1EE24 ; Arabic # Lo ARABIC MATHEMATICAL INITIAL HEH
+1EE27 ; Arabic # Lo ARABIC MATHEMATICAL INITIAL HAH
+1EE29..1EE32 ; Arabic # Lo [10] ARABIC MATHEMATICAL INITIAL YEH..ARABIC MATHEMATICAL INITIAL QAF
+1EE34..1EE37 ; Arabic # Lo [4] ARABIC MATHEMATICAL INITIAL SHEEN..ARABIC MATHEMATICAL INITIAL KHAH
+1EE39 ; Arabic # Lo ARABIC MATHEMATICAL INITIAL DAD
+1EE3B ; Arabic # Lo ARABIC MATHEMATICAL INITIAL GHAIN
+1EE42 ; Arabic # Lo ARABIC MATHEMATICAL TAILED JEEM
+1EE47 ; Arabic # Lo ARABIC MATHEMATICAL TAILED HAH
+1EE49 ; Arabic # Lo ARABIC MATHEMATICAL TAILED YEH
+1EE4B ; Arabic # Lo ARABIC MATHEMATICAL TAILED LAM
+1EE4D..1EE4F ; Arabic # Lo [3] ARABIC MATHEMATICAL TAILED NOON..ARABIC MATHEMATICAL TAILED AIN
+1EE51..1EE52 ; Arabic # Lo [2] ARABIC MATHEMATICAL TAILED SAD..ARABIC MATHEMATICAL TAILED QAF
+1EE54 ; Arabic # Lo ARABIC MATHEMATICAL TAILED SHEEN
+1EE57 ; Arabic # Lo ARABIC MATHEMATICAL TAILED KHAH
+1EE59 ; Arabic # Lo ARABIC MATHEMATICAL TAILED DAD
+1EE5B ; Arabic # Lo ARABIC MATHEMATICAL TAILED GHAIN
+1EE5D ; Arabic # Lo ARABIC MATHEMATICAL TAILED DOTLESS NOON
+1EE5F ; Arabic # Lo ARABIC MATHEMATICAL TAILED DOTLESS QAF
+1EE61..1EE62 ; Arabic # Lo [2] ARABIC MATHEMATICAL STRETCHED BEH..ARABIC MATHEMATICAL STRETCHED JEEM
+1EE64 ; Arabic # Lo ARABIC MATHEMATICAL STRETCHED HEH
+1EE67..1EE6A ; Arabic # Lo [4] ARABIC MATHEMATICAL STRETCHED HAH..ARABIC MATHEMATICAL STRETCHED KAF
+1EE6C..1EE72 ; Arabic # Lo [7] ARABIC MATHEMATICAL STRETCHED MEEM..ARABIC MATHEMATICAL STRETCHED QAF
+1EE74..1EE77 ; Arabic # Lo [4] ARABIC MATHEMATICAL STRETCHED SHEEN..ARABIC MATHEMATICAL STRETCHED KHAH
+1EE79..1EE7C ; Arabic # Lo [4] ARABIC MATHEMATICAL STRETCHED DAD..ARABIC MATHEMATICAL STRETCHED DOTLESS BEH
+1EE7E ; Arabic # Lo ARABIC MATHEMATICAL STRETCHED DOTLESS FEH
+1EE80..1EE89 ; Arabic # Lo [10] ARABIC MATHEMATICAL LOOPED ALEF..ARABIC MATHEMATICAL LOOPED YEH
+1EE8B..1EE9B ; Arabic # Lo [17] ARABIC MATHEMATICAL LOOPED LAM..ARABIC MATHEMATICAL LOOPED GHAIN
+1EEA1..1EEA3 ; Arabic # Lo [3] ARABIC MATHEMATICAL DOUBLE-STRUCK BEH..ARABIC MATHEMATICAL DOUBLE-STRUCK DAL
+1EEA5..1EEA9 ; Arabic # Lo [5] ARABIC MATHEMATICAL DOUBLE-STRUCK WAW..ARABIC MATHEMATICAL DOUBLE-STRUCK YEH
+1EEAB..1EEBB ; Arabic # Lo [17] ARABIC MATHEMATICAL DOUBLE-STRUCK LAM..ARABIC MATHEMATICAL DOUBLE-STRUCK GHAIN
+1EEF0..1EEF1 ; Arabic # Sm [2] ARABIC MATHEMATICAL OPERATOR MEEM WITH HAH WITH TATWEEL..ARABIC MATHEMATICAL OPERATOR HAH WITH DAL
+
+# Total code points: 1368
+
+# ================================================
+
+0700..070D ; Syriac # Po [14] SYRIAC END OF PARAGRAPH..SYRIAC HARKLEAN ASTERISCUS
+070F ; Syriac # Cf SYRIAC ABBREVIATION MARK
+0710 ; Syriac # Lo SYRIAC LETTER ALAPH
+0711 ; Syriac # Mn SYRIAC LETTER SUPERSCRIPT ALAPH
+0712..072F ; Syriac # Lo [30] SYRIAC LETTER BETH..SYRIAC LETTER PERSIAN DHALATH
+0730..074A ; Syriac # Mn [27] SYRIAC PTHAHA ABOVE..SYRIAC BARREKH
+074D..074F ; Syriac # Lo [3] SYRIAC LETTER SOGDIAN ZHAIN..SYRIAC LETTER SOGDIAN FE
+0860..086A ; Syriac # Lo [11] SYRIAC LETTER MALAYALAM NGA..SYRIAC LETTER MALAYALAM SSA
+
+# Total code points: 88
+
+# ================================================
+
+0780..07A5 ; Thaana # Lo [38] THAANA LETTER HAA..THAANA LETTER WAAVU
+07A6..07B0 ; Thaana # Mn [11] THAANA ABAFILI..THAANA SUKUN
+07B1 ; Thaana # Lo THAANA LETTER NAA
+
+# Total code points: 50
+
+# ================================================
+
+0900..0902 ; Devanagari # Mn [3] DEVANAGARI SIGN INVERTED CANDRABINDU..DEVANAGARI SIGN ANUSVARA
+0903 ; Devanagari # Mc DEVANAGARI SIGN VISARGA
+0904..0939 ; Devanagari # Lo [54] DEVANAGARI LETTER SHORT A..DEVANAGARI LETTER HA
+093A ; Devanagari # Mn DEVANAGARI VOWEL SIGN OE
+093B ; Devanagari # Mc DEVANAGARI VOWEL SIGN OOE
+093C ; Devanagari # Mn DEVANAGARI SIGN NUKTA
+093D ; Devanagari # Lo DEVANAGARI SIGN AVAGRAHA
+093E..0940 ; Devanagari # Mc [3] DEVANAGARI VOWEL SIGN AA..DEVANAGARI VOWEL SIGN II
+0941..0948 ; Devanagari # Mn [8] DEVANAGARI VOWEL SIGN U..DEVANAGARI VOWEL SIGN AI
+0949..094C ; Devanagari # Mc [4] DEVANAGARI VOWEL SIGN CANDRA O..DEVANAGARI VOWEL SIGN AU
+094D ; Devanagari # Mn DEVANAGARI SIGN VIRAMA
+094E..094F ; Devanagari # Mc [2] DEVANAGARI VOWEL SIGN PRISHTHAMATRA E..DEVANAGARI VOWEL SIGN AW
+0950 ; Devanagari # Lo DEVANAGARI OM
+0955..0957 ; Devanagari # Mn [3] DEVANAGARI VOWEL SIGN CANDRA LONG E..DEVANAGARI VOWEL SIGN UUE
+0958..0961 ; Devanagari # Lo [10] DEVANAGARI LETTER QA..DEVANAGARI LETTER VOCALIC LL
+0962..0963 ; Devanagari # Mn [2] DEVANAGARI VOWEL SIGN VOCALIC L..DEVANAGARI VOWEL SIGN VOCALIC LL
+0966..096F ; Devanagari # Nd [10] DEVANAGARI DIGIT ZERO..DEVANAGARI DIGIT NINE
+0970 ; Devanagari # Po DEVANAGARI ABBREVIATION SIGN
+0971 ; Devanagari # Lm DEVANAGARI SIGN HIGH SPACING DOT
+0972..097F ; Devanagari # Lo [14] DEVANAGARI LETTER CANDRA A..DEVANAGARI LETTER BBA
+A8E0..A8F1 ; Devanagari # Mn [18] COMBINING DEVANAGARI DIGIT ZERO..COMBINING DEVANAGARI SIGN AVAGRAHA
+A8F2..A8F7 ; Devanagari # Lo [6] DEVANAGARI SIGN SPACING CANDRABINDU..DEVANAGARI SIGN CANDRABINDU AVAGRAHA
+A8F8..A8FA ; Devanagari # Po [3] DEVANAGARI SIGN PUSHPIKA..DEVANAGARI CARET
+A8FB ; Devanagari # Lo DEVANAGARI HEADSTROKE
+A8FC ; Devanagari # Po DEVANAGARI SIGN SIDDHAM
+A8FD..A8FE ; Devanagari # Lo [2] DEVANAGARI JAIN OM..DEVANAGARI LETTER AY
+A8FF ; Devanagari # Mn DEVANAGARI VOWEL SIGN AY
+11B00..11B09 ; Devanagari # Po [10] DEVANAGARI HEAD MARK..DEVANAGARI SIGN MINDU
+
+# Total code points: 164
+
+# ================================================
+
+0980 ; Bengali # Lo BENGALI ANJI
+0981 ; Bengali # Mn BENGALI SIGN CANDRABINDU
+0982..0983 ; Bengali # Mc [2] BENGALI SIGN ANUSVARA..BENGALI SIGN VISARGA
+0985..098C ; Bengali # Lo [8] BENGALI LETTER A..BENGALI LETTER VOCALIC L
+098F..0990 ; Bengali # Lo [2] BENGALI LETTER E..BENGALI LETTER AI
+0993..09A8 ; Bengali # Lo [22] BENGALI LETTER O..BENGALI LETTER NA
+09AA..09B0 ; Bengali # Lo [7] BENGALI LETTER PA..BENGALI LETTER RA
+09B2 ; Bengali # Lo BENGALI LETTER LA
+09B6..09B9 ; Bengali # Lo [4] BENGALI LETTER SHA..BENGALI LETTER HA
+09BC ; Bengali # Mn BENGALI SIGN NUKTA
+09BD ; Bengali # Lo BENGALI SIGN AVAGRAHA
+09BE..09C0 ; Bengali # Mc [3] BENGALI VOWEL SIGN AA..BENGALI VOWEL SIGN II
+09C1..09C4 ; Bengali # Mn [4] BENGALI VOWEL SIGN U..BENGALI VOWEL SIGN VOCALIC RR
+09C7..09C8 ; Bengali # Mc [2] BENGALI VOWEL SIGN E..BENGALI VOWEL SIGN AI
+09CB..09CC ; Bengali # Mc [2] BENGALI VOWEL SIGN O..BENGALI VOWEL SIGN AU
+09CD ; Bengali # Mn BENGALI SIGN VIRAMA
+09CE ; Bengali # Lo BENGALI LETTER KHANDA TA
+09D7 ; Bengali # Mc BENGALI AU LENGTH MARK
+09DC..09DD ; Bengali # Lo [2] BENGALI LETTER RRA..BENGALI LETTER RHA
+09DF..09E1 ; Bengali # Lo [3] BENGALI LETTER YYA..BENGALI LETTER VOCALIC LL
+09E2..09E3 ; Bengali # Mn [2] BENGALI VOWEL SIGN VOCALIC L..BENGALI VOWEL SIGN VOCALIC LL
+09E6..09EF ; Bengali # Nd [10] BENGALI DIGIT ZERO..BENGALI DIGIT NINE
+09F0..09F1 ; Bengali # Lo [2] BENGALI LETTER RA WITH MIDDLE DIAGONAL..BENGALI LETTER RA WITH LOWER DIAGONAL
+09F2..09F3 ; Bengali # Sc [2] BENGALI RUPEE MARK..BENGALI RUPEE SIGN
+09F4..09F9 ; Bengali # No [6] BENGALI CURRENCY NUMERATOR ONE..BENGALI CURRENCY DENOMINATOR SIXTEEN
+09FA ; Bengali # So BENGALI ISSHAR
+09FB ; Bengali # Sc BENGALI GANDA MARK
+09FC ; Bengali # Lo BENGALI LETTER VEDIC ANUSVARA
+09FD ; Bengali # Po BENGALI ABBREVIATION SIGN
+09FE ; Bengali # Mn BENGALI SANDHI MARK
+
+# Total code points: 96
+
+# ================================================
+
+0A01..0A02 ; Gurmukhi # Mn [2] GURMUKHI SIGN ADAK BINDI..GURMUKHI SIGN BINDI
+0A03 ; Gurmukhi # Mc GURMUKHI SIGN VISARGA
+0A05..0A0A ; Gurmukhi # Lo [6] GURMUKHI LETTER A..GURMUKHI LETTER UU
+0A0F..0A10 ; Gurmukhi # Lo [2] GURMUKHI LETTER EE..GURMUKHI LETTER AI
+0A13..0A28 ; Gurmukhi # Lo [22] GURMUKHI LETTER OO..GURMUKHI LETTER NA
+0A2A..0A30 ; Gurmukhi # Lo [7] GURMUKHI LETTER PA..GURMUKHI LETTER RA
+0A32..0A33 ; Gurmukhi # Lo [2] GURMUKHI LETTER LA..GURMUKHI LETTER LLA
+0A35..0A36 ; Gurmukhi # Lo [2] GURMUKHI LETTER VA..GURMUKHI LETTER SHA
+0A38..0A39 ; Gurmukhi # Lo [2] GURMUKHI LETTER SA..GURMUKHI LETTER HA
+0A3C ; Gurmukhi # Mn GURMUKHI SIGN NUKTA
+0A3E..0A40 ; Gurmukhi # Mc [3] GURMUKHI VOWEL SIGN AA..GURMUKHI VOWEL SIGN II
+0A41..0A42 ; Gurmukhi # Mn [2] GURMUKHI VOWEL SIGN U..GURMUKHI VOWEL SIGN UU
+0A47..0A48 ; Gurmukhi # Mn [2] GURMUKHI VOWEL SIGN EE..GURMUKHI VOWEL SIGN AI
+0A4B..0A4D ; Gurmukhi # Mn [3] GURMUKHI VOWEL SIGN OO..GURMUKHI SIGN VIRAMA
+0A51 ; Gurmukhi # Mn GURMUKHI SIGN UDAAT
+0A59..0A5C ; Gurmukhi # Lo [4] GURMUKHI LETTER KHHA..GURMUKHI LETTER RRA
+0A5E ; Gurmukhi # Lo GURMUKHI LETTER FA
+0A66..0A6F ; Gurmukhi # Nd [10] GURMUKHI DIGIT ZERO..GURMUKHI DIGIT NINE
+0A70..0A71 ; Gurmukhi # Mn [2] GURMUKHI TIPPI..GURMUKHI ADDAK
+0A72..0A74 ; Gurmukhi # Lo [3] GURMUKHI IRI..GURMUKHI EK ONKAR
+0A75 ; Gurmukhi # Mn GURMUKHI SIGN YAKASH
+0A76 ; Gurmukhi # Po GURMUKHI ABBREVIATION SIGN
+
+# Total code points: 80
+
+# ================================================
+
+0A81..0A82 ; Gujarati # Mn [2] GUJARATI SIGN CANDRABINDU..GUJARATI SIGN ANUSVARA
+0A83 ; Gujarati # Mc GUJARATI SIGN VISARGA
+0A85..0A8D ; Gujarati # Lo [9] GUJARATI LETTER A..GUJARATI VOWEL CANDRA E
+0A8F..0A91 ; Gujarati # Lo [3] GUJARATI LETTER E..GUJARATI VOWEL CANDRA O
+0A93..0AA8 ; Gujarati # Lo [22] GUJARATI LETTER O..GUJARATI LETTER NA
+0AAA..0AB0 ; Gujarati # Lo [7] GUJARATI LETTER PA..GUJARATI LETTER RA
+0AB2..0AB3 ; Gujarati # Lo [2] GUJARATI LETTER LA..GUJARATI LETTER LLA
+0AB5..0AB9 ; Gujarati # Lo [5] GUJARATI LETTER VA..GUJARATI LETTER HA
+0ABC ; Gujarati # Mn GUJARATI SIGN NUKTA
+0ABD ; Gujarati # Lo GUJARATI SIGN AVAGRAHA
+0ABE..0AC0 ; Gujarati # Mc [3] GUJARATI VOWEL SIGN AA..GUJARATI VOWEL SIGN II
+0AC1..0AC5 ; Gujarati # Mn [5] GUJARATI VOWEL SIGN U..GUJARATI VOWEL SIGN CANDRA E
+0AC7..0AC8 ; Gujarati # Mn [2] GUJARATI VOWEL SIGN E..GUJARATI VOWEL SIGN AI
+0AC9 ; Gujarati # Mc GUJARATI VOWEL SIGN CANDRA O
+0ACB..0ACC ; Gujarati # Mc [2] GUJARATI VOWEL SIGN O..GUJARATI VOWEL SIGN AU
+0ACD ; Gujarati # Mn GUJARATI SIGN VIRAMA
+0AD0 ; Gujarati # Lo GUJARATI OM
+0AE0..0AE1 ; Gujarati # Lo [2] GUJARATI LETTER VOCALIC RR..GUJARATI LETTER VOCALIC LL
+0AE2..0AE3 ; Gujarati # Mn [2] GUJARATI VOWEL SIGN VOCALIC L..GUJARATI VOWEL SIGN VOCALIC LL
+0AE6..0AEF ; Gujarati # Nd [10] GUJARATI DIGIT ZERO..GUJARATI DIGIT NINE
+0AF0 ; Gujarati # Po GUJARATI ABBREVIATION SIGN
+0AF1 ; Gujarati # Sc GUJARATI RUPEE SIGN
+0AF9 ; Gujarati # Lo GUJARATI LETTER ZHA
+0AFA..0AFF ; Gujarati # Mn [6] GUJARATI SIGN SUKUN..GUJARATI SIGN TWO-CIRCLE NUKTA ABOVE
+
+# Total code points: 91
+
+# ================================================
+
+0B01 ; Oriya # Mn ORIYA SIGN CANDRABINDU
+0B02..0B03 ; Oriya # Mc [2] ORIYA SIGN ANUSVARA..ORIYA SIGN VISARGA
+0B05..0B0C ; Oriya # Lo [8] ORIYA LETTER A..ORIYA LETTER VOCALIC L
+0B0F..0B10 ; Oriya # Lo [2] ORIYA LETTER E..ORIYA LETTER AI
+0B13..0B28 ; Oriya # Lo [22] ORIYA LETTER O..ORIYA LETTER NA
+0B2A..0B30 ; Oriya # Lo [7] ORIYA LETTER PA..ORIYA LETTER RA
+0B32..0B33 ; Oriya # Lo [2] ORIYA LETTER LA..ORIYA LETTER LLA
+0B35..0B39 ; Oriya # Lo [5] ORIYA LETTER VA..ORIYA LETTER HA
+0B3C ; Oriya # Mn ORIYA SIGN NUKTA
+0B3D ; Oriya # Lo ORIYA SIGN AVAGRAHA
+0B3E ; Oriya # Mc ORIYA VOWEL SIGN AA
+0B3F ; Oriya # Mn ORIYA VOWEL SIGN I
+0B40 ; Oriya # Mc ORIYA VOWEL SIGN II
+0B41..0B44 ; Oriya # Mn [4] ORIYA VOWEL SIGN U..ORIYA VOWEL SIGN VOCALIC RR
+0B47..0B48 ; Oriya # Mc [2] ORIYA VOWEL SIGN E..ORIYA VOWEL SIGN AI
+0B4B..0B4C ; Oriya # Mc [2] ORIYA VOWEL SIGN O..ORIYA VOWEL SIGN AU
+0B4D ; Oriya # Mn ORIYA SIGN VIRAMA
+0B55..0B56 ; Oriya # Mn [2] ORIYA SIGN OVERLINE..ORIYA AI LENGTH MARK
+0B57 ; Oriya # Mc ORIYA AU LENGTH MARK
+0B5C..0B5D ; Oriya # Lo [2] ORIYA LETTER RRA..ORIYA LETTER RHA
+0B5F..0B61 ; Oriya # Lo [3] ORIYA LETTER YYA..ORIYA LETTER VOCALIC LL
+0B62..0B63 ; Oriya # Mn [2] ORIYA VOWEL SIGN VOCALIC L..ORIYA VOWEL SIGN VOCALIC LL
+0B66..0B6F ; Oriya # Nd [10] ORIYA DIGIT ZERO..ORIYA DIGIT NINE
+0B70 ; Oriya # So ORIYA ISSHAR
+0B71 ; Oriya # Lo ORIYA LETTER WA
+0B72..0B77 ; Oriya # No [6] ORIYA FRACTION ONE QUARTER..ORIYA FRACTION THREE SIXTEENTHS
+
+# Total code points: 91
+
+# ================================================
+
+0B82 ; Tamil # Mn TAMIL SIGN ANUSVARA
+0B83 ; Tamil # Lo TAMIL SIGN VISARGA
+0B85..0B8A ; Tamil # Lo [6] TAMIL LETTER A..TAMIL LETTER UU
+0B8E..0B90 ; Tamil # Lo [3] TAMIL LETTER E..TAMIL LETTER AI
+0B92..0B95 ; Tamil # Lo [4] TAMIL LETTER O..TAMIL LETTER KA
+0B99..0B9A ; Tamil # Lo [2] TAMIL LETTER NGA..TAMIL LETTER CA
+0B9C ; Tamil # Lo TAMIL LETTER JA
+0B9E..0B9F ; Tamil # Lo [2] TAMIL LETTER NYA..TAMIL LETTER TTA
+0BA3..0BA4 ; Tamil # Lo [2] TAMIL LETTER NNA..TAMIL LETTER TA
+0BA8..0BAA ; Tamil # Lo [3] TAMIL LETTER NA..TAMIL LETTER PA
+0BAE..0BB9 ; Tamil # Lo [12] TAMIL LETTER MA..TAMIL LETTER HA
+0BBE..0BBF ; Tamil # Mc [2] TAMIL VOWEL SIGN AA..TAMIL VOWEL SIGN I
+0BC0 ; Tamil # Mn TAMIL VOWEL SIGN II
+0BC1..0BC2 ; Tamil # Mc [2] TAMIL VOWEL SIGN U..TAMIL VOWEL SIGN UU
+0BC6..0BC8 ; Tamil # Mc [3] TAMIL VOWEL SIGN E..TAMIL VOWEL SIGN AI
+0BCA..0BCC ; Tamil # Mc [3] TAMIL VOWEL SIGN O..TAMIL VOWEL SIGN AU
+0BCD ; Tamil # Mn TAMIL SIGN VIRAMA
+0BD0 ; Tamil # Lo TAMIL OM
+0BD7 ; Tamil # Mc TAMIL AU LENGTH MARK
+0BE6..0BEF ; Tamil # Nd [10] TAMIL DIGIT ZERO..TAMIL DIGIT NINE
+0BF0..0BF2 ; Tamil # No [3] TAMIL NUMBER TEN..TAMIL NUMBER ONE THOUSAND
+0BF3..0BF8 ; Tamil # So [6] TAMIL DAY SIGN..TAMIL AS ABOVE SIGN
+0BF9 ; Tamil # Sc TAMIL RUPEE SIGN
+0BFA ; Tamil # So TAMIL NUMBER SIGN
+11FC0..11FD4 ; Tamil # No [21] TAMIL FRACTION ONE THREE-HUNDRED-AND-TWENTIETH..TAMIL FRACTION DOWNSCALING FACTOR KIIZH
+11FD5..11FDC ; Tamil # So [8] TAMIL SIGN NEL..TAMIL SIGN MUKKURUNI
+11FDD..11FE0 ; Tamil # Sc [4] TAMIL SIGN KAACU..TAMIL SIGN VARAAKAN
+11FE1..11FF1 ; Tamil # So [17] TAMIL SIGN PAARAM..TAMIL SIGN VAKAIYARAA
+11FFF ; Tamil # Po TAMIL PUNCTUATION END OF TEXT
+
+# Total code points: 123
+
+# ================================================
+
+0C00 ; Telugu # Mn TELUGU SIGN COMBINING CANDRABINDU ABOVE
+0C01..0C03 ; Telugu # Mc [3] TELUGU SIGN CANDRABINDU..TELUGU SIGN VISARGA
+0C04 ; Telugu # Mn TELUGU SIGN COMBINING ANUSVARA ABOVE
+0C05..0C0C ; Telugu # Lo [8] TELUGU LETTER A..TELUGU LETTER VOCALIC L
+0C0E..0C10 ; Telugu # Lo [3] TELUGU LETTER E..TELUGU LETTER AI
+0C12..0C28 ; Telugu # Lo [23] TELUGU LETTER O..TELUGU LETTER NA
+0C2A..0C39 ; Telugu # Lo [16] TELUGU LETTER PA..TELUGU LETTER HA
+0C3C ; Telugu # Mn TELUGU SIGN NUKTA
+0C3D ; Telugu # Lo TELUGU SIGN AVAGRAHA
+0C3E..0C40 ; Telugu # Mn [3] TELUGU VOWEL SIGN AA..TELUGU VOWEL SIGN II
+0C41..0C44 ; Telugu # Mc [4] TELUGU VOWEL SIGN U..TELUGU VOWEL SIGN VOCALIC RR
+0C46..0C48 ; Telugu # Mn [3] TELUGU VOWEL SIGN E..TELUGU VOWEL SIGN AI
+0C4A..0C4D ; Telugu # Mn [4] TELUGU VOWEL SIGN O..TELUGU SIGN VIRAMA
+0C55..0C56 ; Telugu # Mn [2] TELUGU LENGTH MARK..TELUGU AI LENGTH MARK
+0C58..0C5A ; Telugu # Lo [3] TELUGU LETTER TSA..TELUGU LETTER RRRA
+0C5D ; Telugu # Lo TELUGU LETTER NAKAARA POLLU
+0C60..0C61 ; Telugu # Lo [2] TELUGU LETTER VOCALIC RR..TELUGU LETTER VOCALIC LL
+0C62..0C63 ; Telugu # Mn [2] TELUGU VOWEL SIGN VOCALIC L..TELUGU VOWEL SIGN VOCALIC LL
+0C66..0C6F ; Telugu # Nd [10] TELUGU DIGIT ZERO..TELUGU DIGIT NINE
+0C77 ; Telugu # Po TELUGU SIGN SIDDHAM
+0C78..0C7E ; Telugu # No [7] TELUGU FRACTION DIGIT ZERO FOR ODD POWERS OF FOUR..TELUGU FRACTION DIGIT THREE FOR EVEN POWERS OF FOUR
+0C7F ; Telugu # So TELUGU SIGN TUUMU
+
+# Total code points: 100
+
+# ================================================
+
+0C80 ; Kannada # Lo KANNADA SIGN SPACING CANDRABINDU
+0C81 ; Kannada # Mn KANNADA SIGN CANDRABINDU
+0C82..0C83 ; Kannada # Mc [2] KANNADA SIGN ANUSVARA..KANNADA SIGN VISARGA
+0C84 ; Kannada # Po KANNADA SIGN SIDDHAM
+0C85..0C8C ; Kannada # Lo [8] KANNADA LETTER A..KANNADA LETTER VOCALIC L
+0C8E..0C90 ; Kannada # Lo [3] KANNADA LETTER E..KANNADA LETTER AI
+0C92..0CA8 ; Kannada # Lo [23] KANNADA LETTER O..KANNADA LETTER NA
+0CAA..0CB3 ; Kannada # Lo [10] KANNADA LETTER PA..KANNADA LETTER LLA
+0CB5..0CB9 ; Kannada # Lo [5] KANNADA LETTER VA..KANNADA LETTER HA
+0CBC ; Kannada # Mn KANNADA SIGN NUKTA
+0CBD ; Kannada # Lo KANNADA SIGN AVAGRAHA
+0CBE ; Kannada # Mc KANNADA VOWEL SIGN AA
+0CBF ; Kannada # Mn KANNADA VOWEL SIGN I
+0CC0..0CC4 ; Kannada # Mc [5] KANNADA VOWEL SIGN II..KANNADA VOWEL SIGN VOCALIC RR
+0CC6 ; Kannada # Mn KANNADA VOWEL SIGN E
+0CC7..0CC8 ; Kannada # Mc [2] KANNADA VOWEL SIGN EE..KANNADA VOWEL SIGN AI
+0CCA..0CCB ; Kannada # Mc [2] KANNADA VOWEL SIGN O..KANNADA VOWEL SIGN OO
+0CCC..0CCD ; Kannada # Mn [2] KANNADA VOWEL SIGN AU..KANNADA SIGN VIRAMA
+0CD5..0CD6 ; Kannada # Mc [2] KANNADA LENGTH MARK..KANNADA AI LENGTH MARK
+0CDD..0CDE ; Kannada # Lo [2] KANNADA LETTER NAKAARA POLLU..KANNADA LETTER FA
+0CE0..0CE1 ; Kannada # Lo [2] KANNADA LETTER VOCALIC RR..KANNADA LETTER VOCALIC LL
+0CE2..0CE3 ; Kannada # Mn [2] KANNADA VOWEL SIGN VOCALIC L..KANNADA VOWEL SIGN VOCALIC LL
+0CE6..0CEF ; Kannada # Nd [10] KANNADA DIGIT ZERO..KANNADA DIGIT NINE
+0CF1..0CF2 ; Kannada # Lo [2] KANNADA SIGN JIHVAMULIYA..KANNADA SIGN UPADHMANIYA
+0CF3 ; Kannada # Mc KANNADA SIGN COMBINING ANUSVARA ABOVE RIGHT
+
+# Total code points: 91
+
+# ================================================
+
+0D00..0D01 ; Malayalam # Mn [2] MALAYALAM SIGN COMBINING ANUSVARA ABOVE..MALAYALAM SIGN CANDRABINDU
+0D02..0D03 ; Malayalam # Mc [2] MALAYALAM SIGN ANUSVARA..MALAYALAM SIGN VISARGA
+0D04..0D0C ; Malayalam # Lo [9] MALAYALAM LETTER VEDIC ANUSVARA..MALAYALAM LETTER VOCALIC L
+0D0E..0D10 ; Malayalam # Lo [3] MALAYALAM LETTER E..MALAYALAM LETTER AI
+0D12..0D3A ; Malayalam # Lo [41] MALAYALAM LETTER O..MALAYALAM LETTER TTTA
+0D3B..0D3C ; Malayalam # Mn [2] MALAYALAM SIGN VERTICAL BAR VIRAMA..MALAYALAM SIGN CIRCULAR VIRAMA
+0D3D ; Malayalam # Lo MALAYALAM SIGN AVAGRAHA
+0D3E..0D40 ; Malayalam # Mc [3] MALAYALAM VOWEL SIGN AA..MALAYALAM VOWEL SIGN II
+0D41..0D44 ; Malayalam # Mn [4] MALAYALAM VOWEL SIGN U..MALAYALAM VOWEL SIGN VOCALIC RR
+0D46..0D48 ; Malayalam # Mc [3] MALAYALAM VOWEL SIGN E..MALAYALAM VOWEL SIGN AI
+0D4A..0D4C ; Malayalam # Mc [3] MALAYALAM VOWEL SIGN O..MALAYALAM VOWEL SIGN AU
+0D4D ; Malayalam # Mn MALAYALAM SIGN VIRAMA
+0D4E ; Malayalam # Lo MALAYALAM LETTER DOT REPH
+0D4F ; Malayalam # So MALAYALAM SIGN PARA
+0D54..0D56 ; Malayalam # Lo [3] MALAYALAM LETTER CHILLU M..MALAYALAM LETTER CHILLU LLL
+0D57 ; Malayalam # Mc MALAYALAM AU LENGTH MARK
+0D58..0D5E ; Malayalam # No [7] MALAYALAM FRACTION ONE ONE-HUNDRED-AND-SIXTIETH..MALAYALAM FRACTION ONE FIFTH
+0D5F..0D61 ; Malayalam # Lo [3] MALAYALAM LETTER ARCHAIC II..MALAYALAM LETTER VOCALIC LL
+0D62..0D63 ; Malayalam # Mn [2] MALAYALAM VOWEL SIGN VOCALIC L..MALAYALAM VOWEL SIGN VOCALIC LL
+0D66..0D6F ; Malayalam # Nd [10] MALAYALAM DIGIT ZERO..MALAYALAM DIGIT NINE
+0D70..0D78 ; Malayalam # No [9] MALAYALAM NUMBER TEN..MALAYALAM FRACTION THREE SIXTEENTHS
+0D79 ; Malayalam # So MALAYALAM DATE MARK
+0D7A..0D7F ; Malayalam # Lo [6] MALAYALAM LETTER CHILLU NN..MALAYALAM LETTER CHILLU K
+
+# Total code points: 118
+
+# ================================================
+
+0D81 ; Sinhala # Mn SINHALA SIGN CANDRABINDU
+0D82..0D83 ; Sinhala # Mc [2] SINHALA SIGN ANUSVARAYA..SINHALA SIGN VISARGAYA
+0D85..0D96 ; Sinhala # Lo [18] SINHALA LETTER AYANNA..SINHALA LETTER AUYANNA
+0D9A..0DB1 ; Sinhala # Lo [24] SINHALA LETTER ALPAPRAANA KAYANNA..SINHALA LETTER DANTAJA NAYANNA
+0DB3..0DBB ; Sinhala # Lo [9] SINHALA LETTER SANYAKA DAYANNA..SINHALA LETTER RAYANNA
+0DBD ; Sinhala # Lo SINHALA LETTER DANTAJA LAYANNA
+0DC0..0DC6 ; Sinhala # Lo [7] SINHALA LETTER VAYANNA..SINHALA LETTER FAYANNA
+0DCA ; Sinhala # Mn SINHALA SIGN AL-LAKUNA
+0DCF..0DD1 ; Sinhala # Mc [3] SINHALA VOWEL SIGN AELA-PILLA..SINHALA VOWEL SIGN DIGA AEDA-PILLA
+0DD2..0DD4 ; Sinhala # Mn [3] SINHALA VOWEL SIGN KETTI IS-PILLA..SINHALA VOWEL SIGN KETTI PAA-PILLA
+0DD6 ; Sinhala # Mn SINHALA VOWEL SIGN DIGA PAA-PILLA
+0DD8..0DDF ; Sinhala # Mc [8] SINHALA VOWEL SIGN GAETTA-PILLA..SINHALA VOWEL SIGN GAYANUKITTA
+0DE6..0DEF ; Sinhala # Nd [10] SINHALA LITH DIGIT ZERO..SINHALA LITH DIGIT NINE
+0DF2..0DF3 ; Sinhala # Mc [2] SINHALA VOWEL SIGN DIGA GAETTA-PILLA..SINHALA VOWEL SIGN DIGA GAYANUKITTA
+0DF4 ; Sinhala # Po SINHALA PUNCTUATION KUNDDALIYA
+111E1..111F4 ; Sinhala # No [20] SINHALA ARCHAIC DIGIT ONE..SINHALA ARCHAIC NUMBER ONE THOUSAND
+
+# Total code points: 111
+
+# ================================================
+
+0E01..0E30 ; Thai # Lo [48] THAI CHARACTER KO KAI..THAI CHARACTER SARA A
+0E31 ; Thai # Mn THAI CHARACTER MAI HAN-AKAT
+0E32..0E33 ; Thai # Lo [2] THAI CHARACTER SARA AA..THAI CHARACTER SARA AM
+0E34..0E3A ; Thai # Mn [7] THAI CHARACTER SARA I..THAI CHARACTER PHINTHU
+0E40..0E45 ; Thai # Lo [6] THAI CHARACTER SARA E..THAI CHARACTER LAKKHANGYAO
+0E46 ; Thai # Lm THAI CHARACTER MAIYAMOK
+0E47..0E4E ; Thai # Mn [8] THAI CHARACTER MAITAIKHU..THAI CHARACTER YAMAKKAN
+0E4F ; Thai # Po THAI CHARACTER FONGMAN
+0E50..0E59 ; Thai # Nd [10] THAI DIGIT ZERO..THAI DIGIT NINE
+0E5A..0E5B ; Thai # Po [2] THAI CHARACTER ANGKHANKHU..THAI CHARACTER KHOMUT
+
+# Total code points: 86
+
+# ================================================
+
+0E81..0E82 ; Lao # Lo [2] LAO LETTER KO..LAO LETTER KHO SUNG
+0E84 ; Lao # Lo LAO LETTER KHO TAM
+0E86..0E8A ; Lao # Lo [5] LAO LETTER PALI GHA..LAO LETTER SO TAM
+0E8C..0EA3 ; Lao # Lo [24] LAO LETTER PALI JHA..LAO LETTER LO LING
+0EA5 ; Lao # Lo LAO LETTER LO LOOT
+0EA7..0EB0 ; Lao # Lo [10] LAO LETTER WO..LAO VOWEL SIGN A
+0EB1 ; Lao # Mn LAO VOWEL SIGN MAI KAN
+0EB2..0EB3 ; Lao # Lo [2] LAO VOWEL SIGN AA..LAO VOWEL SIGN AM
+0EB4..0EBC ; Lao # Mn [9] LAO VOWEL SIGN I..LAO SEMIVOWEL SIGN LO
+0EBD ; Lao # Lo LAO SEMIVOWEL SIGN NYO
+0EC0..0EC4 ; Lao # Lo [5] LAO VOWEL SIGN E..LAO VOWEL SIGN AI
+0EC6 ; Lao # Lm LAO KO LA
+0EC8..0ECE ; Lao # Mn [7] LAO TONE MAI EK..LAO YAMAKKAN
+0ED0..0ED9 ; Lao # Nd [10] LAO DIGIT ZERO..LAO DIGIT NINE
+0EDC..0EDF ; Lao # Lo [4] LAO HO NO..LAO LETTER KHMU NYO
+
+# Total code points: 83
+
+# ================================================
+
+0F00 ; Tibetan # Lo TIBETAN SYLLABLE OM
+0F01..0F03 ; Tibetan # So [3] TIBETAN MARK GTER YIG MGO TRUNCATED A..TIBETAN MARK GTER YIG MGO -UM GTER TSHEG MA
+0F04..0F12 ; Tibetan # Po [15] TIBETAN MARK INITIAL YIG MGO MDUN MA..TIBETAN MARK RGYA GRAM SHAD
+0F13 ; Tibetan # So TIBETAN MARK CARET -DZUD RTAGS ME LONG CAN
+0F14 ; Tibetan # Po TIBETAN MARK GTER TSHEG
+0F15..0F17 ; Tibetan # So [3] TIBETAN LOGOTYPE SIGN CHAD RTAGS..TIBETAN ASTROLOGICAL SIGN SGRA GCAN -CHAR RTAGS
+0F18..0F19 ; Tibetan # Mn [2] TIBETAN ASTROLOGICAL SIGN -KHYUD PA..TIBETAN ASTROLOGICAL SIGN SDONG TSHUGS
+0F1A..0F1F ; Tibetan # So [6] TIBETAN SIGN RDEL DKAR GCIG..TIBETAN SIGN RDEL DKAR RDEL NAG
+0F20..0F29 ; Tibetan # Nd [10] TIBETAN DIGIT ZERO..TIBETAN DIGIT NINE
+0F2A..0F33 ; Tibetan # No [10] TIBETAN DIGIT HALF ONE..TIBETAN DIGIT HALF ZERO
+0F34 ; Tibetan # So TIBETAN MARK BSDUS RTAGS
+0F35 ; Tibetan # Mn TIBETAN MARK NGAS BZUNG NYI ZLA
+0F36 ; Tibetan # So TIBETAN MARK CARET -DZUD RTAGS BZHI MIG CAN
+0F37 ; Tibetan # Mn TIBETAN MARK NGAS BZUNG SGOR RTAGS
+0F38 ; Tibetan # So TIBETAN MARK CHE MGO
+0F39 ; Tibetan # Mn TIBETAN MARK TSA -PHRU
+0F3A ; Tibetan # Ps TIBETAN MARK GUG RTAGS GYON
+0F3B ; Tibetan # Pe TIBETAN MARK GUG RTAGS GYAS
+0F3C ; Tibetan # Ps TIBETAN MARK ANG KHANG GYON
+0F3D ; Tibetan # Pe TIBETAN MARK ANG KHANG GYAS
+0F3E..0F3F ; Tibetan # Mc [2] TIBETAN SIGN YAR TSHES..TIBETAN SIGN MAR TSHES
+0F40..0F47 ; Tibetan # Lo [8] TIBETAN LETTER KA..TIBETAN LETTER JA
+0F49..0F6C ; Tibetan # Lo [36] TIBETAN LETTER NYA..TIBETAN LETTER RRA
+0F71..0F7E ; Tibetan # Mn [14] TIBETAN VOWEL SIGN AA..TIBETAN SIGN RJES SU NGA RO
+0F7F ; Tibetan # Mc TIBETAN SIGN RNAM BCAD
+0F80..0F84 ; Tibetan # Mn [5] TIBETAN VOWEL SIGN REVERSED I..TIBETAN MARK HALANTA
+0F85 ; Tibetan # Po TIBETAN MARK PALUTA
+0F86..0F87 ; Tibetan # Mn [2] TIBETAN SIGN LCI RTAGS..TIBETAN SIGN YANG RTAGS
+0F88..0F8C ; Tibetan # Lo [5] TIBETAN SIGN LCE TSA CAN..TIBETAN SIGN INVERTED MCHU CAN
+0F8D..0F97 ; Tibetan # Mn [11] TIBETAN SUBJOINED SIGN LCE TSA CAN..TIBETAN SUBJOINED LETTER JA
+0F99..0FBC ; Tibetan # Mn [36] TIBETAN SUBJOINED LETTER NYA..TIBETAN SUBJOINED LETTER FIXED-FORM RA
+0FBE..0FC5 ; Tibetan # So [8] TIBETAN KU RU KHA..TIBETAN SYMBOL RDO RJE
+0FC6 ; Tibetan # Mn TIBETAN SYMBOL PADMA GDAN
+0FC7..0FCC ; Tibetan # So [6] TIBETAN SYMBOL RDO RJE RGYA GRAM..TIBETAN SYMBOL NOR BU BZHI -KHYIL
+0FCE..0FCF ; Tibetan # So [2] TIBETAN SIGN RDEL NAG RDEL DKAR..TIBETAN SIGN RDEL NAG GSUM
+0FD0..0FD4 ; Tibetan # Po [5] TIBETAN MARK BSKA- SHOG GI MGO RGYAN..TIBETAN MARK CLOSING BRDA RNYING YIG MGO SGAB MA
+0FD9..0FDA ; Tibetan # Po [2] TIBETAN MARK LEADING MCHAN RTAGS..TIBETAN MARK TRAILING MCHAN RTAGS
+
+# Total code points: 207
+
+# ================================================
+
+1000..102A ; Myanmar # Lo [43] MYANMAR LETTER KA..MYANMAR LETTER AU
+102B..102C ; Myanmar # Mc [2] MYANMAR VOWEL SIGN TALL AA..MYANMAR VOWEL SIGN AA
+102D..1030 ; Myanmar # Mn [4] MYANMAR VOWEL SIGN I..MYANMAR VOWEL SIGN UU
+1031 ; Myanmar # Mc MYANMAR VOWEL SIGN E
+1032..1037 ; Myanmar # Mn [6] MYANMAR VOWEL SIGN AI..MYANMAR SIGN DOT BELOW
+1038 ; Myanmar # Mc MYANMAR SIGN VISARGA
+1039..103A ; Myanmar # Mn [2] MYANMAR SIGN VIRAMA..MYANMAR SIGN ASAT
+103B..103C ; Myanmar # Mc [2] MYANMAR CONSONANT SIGN MEDIAL YA..MYANMAR CONSONANT SIGN MEDIAL RA
+103D..103E ; Myanmar # Mn [2] MYANMAR CONSONANT SIGN MEDIAL WA..MYANMAR CONSONANT SIGN MEDIAL HA
+103F ; Myanmar # Lo MYANMAR LETTER GREAT SA
+1040..1049 ; Myanmar # Nd [10] MYANMAR DIGIT ZERO..MYANMAR DIGIT NINE
+104A..104F ; Myanmar # Po [6] MYANMAR SIGN LITTLE SECTION..MYANMAR SYMBOL GENITIVE
+1050..1055 ; Myanmar # Lo [6] MYANMAR LETTER SHA..MYANMAR LETTER VOCALIC LL
+1056..1057 ; Myanmar # Mc [2] MYANMAR VOWEL SIGN VOCALIC R..MYANMAR VOWEL SIGN VOCALIC RR
+1058..1059 ; Myanmar # Mn [2] MYANMAR VOWEL SIGN VOCALIC L..MYANMAR VOWEL SIGN VOCALIC LL
+105A..105D ; Myanmar # Lo [4] MYANMAR LETTER MON NGA..MYANMAR LETTER MON BBE
+105E..1060 ; Myanmar # Mn [3] MYANMAR CONSONANT SIGN MON MEDIAL NA..MYANMAR CONSONANT SIGN MON MEDIAL LA
+1061 ; Myanmar # Lo MYANMAR LETTER SGAW KAREN SHA
+1062..1064 ; Myanmar # Mc [3] MYANMAR VOWEL SIGN SGAW KAREN EU..MYANMAR TONE MARK SGAW KAREN KE PHO
+1065..1066 ; Myanmar # Lo [2] MYANMAR LETTER WESTERN PWO KAREN THA..MYANMAR LETTER WESTERN PWO KAREN PWA
+1067..106D ; Myanmar # Mc [7] MYANMAR VOWEL SIGN WESTERN PWO KAREN EU..MYANMAR SIGN WESTERN PWO KAREN TONE-5
+106E..1070 ; Myanmar # Lo [3] MYANMAR LETTER EASTERN PWO KAREN NNA..MYANMAR LETTER EASTERN PWO KAREN GHWA
+1071..1074 ; Myanmar # Mn [4] MYANMAR VOWEL SIGN GEBA KAREN I..MYANMAR VOWEL SIGN KAYAH EE
+1075..1081 ; Myanmar # Lo [13] MYANMAR LETTER SHAN KA..MYANMAR LETTER SHAN HA
+1082 ; Myanmar # Mn MYANMAR CONSONANT SIGN SHAN MEDIAL WA
+1083..1084 ; Myanmar # Mc [2] MYANMAR VOWEL SIGN SHAN AA..MYANMAR VOWEL SIGN SHAN E
+1085..1086 ; Myanmar # Mn [2] MYANMAR VOWEL SIGN SHAN E ABOVE..MYANMAR VOWEL SIGN SHAN FINAL Y
+1087..108C ; Myanmar # Mc [6] MYANMAR SIGN SHAN TONE-2..MYANMAR SIGN SHAN COUNCIL TONE-3
+108D ; Myanmar # Mn MYANMAR SIGN SHAN COUNCIL EMPHATIC TONE
+108E ; Myanmar # Lo MYANMAR LETTER RUMAI PALAUNG FA
+108F ; Myanmar # Mc MYANMAR SIGN RUMAI PALAUNG TONE-5
+1090..1099 ; Myanmar # Nd [10] MYANMAR SHAN DIGIT ZERO..MYANMAR SHAN DIGIT NINE
+109A..109C ; Myanmar # Mc [3] MYANMAR SIGN KHAMTI TONE-1..MYANMAR VOWEL SIGN AITON A
+109D ; Myanmar # Mn MYANMAR VOWEL SIGN AITON AI
+109E..109F ; Myanmar # So [2] MYANMAR SYMBOL SHAN ONE..MYANMAR SYMBOL SHAN EXCLAMATION
+A9E0..A9E4 ; Myanmar # Lo [5] MYANMAR LETTER SHAN GHA..MYANMAR LETTER SHAN BHA
+A9E5 ; Myanmar # Mn MYANMAR SIGN SHAN SAW
+A9E6 ; Myanmar # Lm MYANMAR MODIFIER LETTER SHAN REDUPLICATION
+A9E7..A9EF ; Myanmar # Lo [9] MYANMAR LETTER TAI LAING NYA..MYANMAR LETTER TAI LAING NNA
+A9F0..A9F9 ; Myanmar # Nd [10] MYANMAR TAI LAING DIGIT ZERO..MYANMAR TAI LAING DIGIT NINE
+A9FA..A9FE ; Myanmar # Lo [5] MYANMAR LETTER TAI LAING LLA..MYANMAR LETTER TAI LAING BHA
+AA60..AA6F ; Myanmar # Lo [16] MYANMAR LETTER KHAMTI GA..MYANMAR LETTER KHAMTI FA
+AA70 ; Myanmar # Lm MYANMAR MODIFIER LETTER KHAMTI REDUPLICATION
+AA71..AA76 ; Myanmar # Lo [6] MYANMAR LETTER KHAMTI XA..MYANMAR LOGOGRAM KHAMTI HM
+AA77..AA79 ; Myanmar # So [3] MYANMAR SYMBOL AITON EXCLAMATION..MYANMAR SYMBOL AITON TWO
+AA7A ; Myanmar # Lo MYANMAR LETTER AITON RA
+AA7B ; Myanmar # Mc MYANMAR SIGN PAO KAREN TONE
+AA7C ; Myanmar # Mn MYANMAR SIGN TAI LAING TONE-2
+AA7D ; Myanmar # Mc MYANMAR SIGN TAI LAING TONE-5
+AA7E..AA7F ; Myanmar # Lo [2] MYANMAR LETTER SHWE PALAUNG CHA..MYANMAR LETTER SHWE PALAUNG SHA
+
+# Total code points: 223
+
+# ================================================
+
+10A0..10C5 ; Georgian # L& [38] GEORGIAN CAPITAL LETTER AN..GEORGIAN CAPITAL LETTER HOE
+10C7 ; Georgian # L& GEORGIAN CAPITAL LETTER YN
+10CD ; Georgian # L& GEORGIAN CAPITAL LETTER AEN
+10D0..10FA ; Georgian # L& [43] GEORGIAN LETTER AN..GEORGIAN LETTER AIN
+10FC ; Georgian # Lm MODIFIER LETTER GEORGIAN NAR
+10FD..10FF ; Georgian # L& [3] GEORGIAN LETTER AEN..GEORGIAN LETTER LABIAL SIGN
+1C90..1CBA ; Georgian # L& [43] GEORGIAN MTAVRULI CAPITAL LETTER AN..GEORGIAN MTAVRULI CAPITAL LETTER AIN
+1CBD..1CBF ; Georgian # L& [3] GEORGIAN MTAVRULI CAPITAL LETTER AEN..GEORGIAN MTAVRULI CAPITAL LETTER LABIAL SIGN
+2D00..2D25 ; Georgian # L& [38] GEORGIAN SMALL LETTER AN..GEORGIAN SMALL LETTER HOE
+2D27 ; Georgian # L& GEORGIAN SMALL LETTER YN
+2D2D ; Georgian # L& GEORGIAN SMALL LETTER AEN
+
+# Total code points: 173
+
+# ================================================
+
+1100..11FF ; Hangul # Lo [256] HANGUL CHOSEONG KIYEOK..HANGUL JONGSEONG SSANGNIEUN
+302E..302F ; Hangul # Mc [2] HANGUL SINGLE DOT TONE MARK..HANGUL DOUBLE DOT TONE MARK
+3131..318E ; Hangul # Lo [94] HANGUL LETTER KIYEOK..HANGUL LETTER ARAEAE
+3200..321E ; Hangul # So [31] PARENTHESIZED HANGUL KIYEOK..PARENTHESIZED KOREAN CHARACTER O HU
+3260..327E ; Hangul # So [31] CIRCLED HANGUL KIYEOK..CIRCLED HANGUL IEUNG U
+A960..A97C ; Hangul # Lo [29] HANGUL CHOSEONG TIKEUT-MIEUM..HANGUL CHOSEONG SSANGYEORINHIEUH
+AC00..D7A3 ; Hangul # Lo [11172] HANGUL SYLLABLE GA..HANGUL SYLLABLE HIH
+D7B0..D7C6 ; Hangul # Lo [23] HANGUL JUNGSEONG O-YEO..HANGUL JUNGSEONG ARAEA-E
+D7CB..D7FB ; Hangul # Lo [49] HANGUL JONGSEONG NIEUN-RIEUL..HANGUL JONGSEONG PHIEUPH-THIEUTH
+FFA0..FFBE ; Hangul # Lo [31] HALFWIDTH HANGUL FILLER..HALFWIDTH HANGUL LETTER HIEUH
+FFC2..FFC7 ; Hangul # Lo [6] HALFWIDTH HANGUL LETTER A..HALFWIDTH HANGUL LETTER E
+FFCA..FFCF ; Hangul # Lo [6] HALFWIDTH HANGUL LETTER YEO..HALFWIDTH HANGUL LETTER OE
+FFD2..FFD7 ; Hangul # Lo [6] HALFWIDTH HANGUL LETTER YO..HALFWIDTH HANGUL LETTER YU
+FFDA..FFDC ; Hangul # Lo [3] HALFWIDTH HANGUL LETTER EU..HALFWIDTH HANGUL LETTER I
+
+# Total code points: 11739
+
+# ================================================
+
+1200..1248 ; Ethiopic # Lo [73] ETHIOPIC SYLLABLE HA..ETHIOPIC SYLLABLE QWA
+124A..124D ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE QWI..ETHIOPIC SYLLABLE QWE
+1250..1256 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE QHA..ETHIOPIC SYLLABLE QHO
+1258 ; Ethiopic # Lo ETHIOPIC SYLLABLE QHWA
+125A..125D ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE QHWI..ETHIOPIC SYLLABLE QHWE
+1260..1288 ; Ethiopic # Lo [41] ETHIOPIC SYLLABLE BA..ETHIOPIC SYLLABLE XWA
+128A..128D ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE XWI..ETHIOPIC SYLLABLE XWE
+1290..12B0 ; Ethiopic # Lo [33] ETHIOPIC SYLLABLE NA..ETHIOPIC SYLLABLE KWA
+12B2..12B5 ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE KWI..ETHIOPIC SYLLABLE KWE
+12B8..12BE ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE KXA..ETHIOPIC SYLLABLE KXO
+12C0 ; Ethiopic # Lo ETHIOPIC SYLLABLE KXWA
+12C2..12C5 ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE KXWI..ETHIOPIC SYLLABLE KXWE
+12C8..12D6 ; Ethiopic # Lo [15] ETHIOPIC SYLLABLE WA..ETHIOPIC SYLLABLE PHARYNGEAL O
+12D8..1310 ; Ethiopic # Lo [57] ETHIOPIC SYLLABLE ZA..ETHIOPIC SYLLABLE GWA
+1312..1315 ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE GWI..ETHIOPIC SYLLABLE GWE
+1318..135A ; Ethiopic # Lo [67] ETHIOPIC SYLLABLE GGA..ETHIOPIC SYLLABLE FYA
+135D..135F ; Ethiopic # Mn [3] ETHIOPIC COMBINING GEMINATION AND VOWEL LENGTH MARK..ETHIOPIC COMBINING GEMINATION MARK
+1360..1368 ; Ethiopic # Po [9] ETHIOPIC SECTION MARK..ETHIOPIC PARAGRAPH SEPARATOR
+1369..137C ; Ethiopic # No [20] ETHIOPIC DIGIT ONE..ETHIOPIC NUMBER TEN THOUSAND
+1380..138F ; Ethiopic # Lo [16] ETHIOPIC SYLLABLE SEBATBEIT MWA..ETHIOPIC SYLLABLE PWE
+1390..1399 ; Ethiopic # So [10] ETHIOPIC TONAL MARK YIZET..ETHIOPIC TONAL MARK KURT
+2D80..2D96 ; Ethiopic # Lo [23] ETHIOPIC SYLLABLE LOA..ETHIOPIC SYLLABLE GGWE
+2DA0..2DA6 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE SSA..ETHIOPIC SYLLABLE SSO
+2DA8..2DAE ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE CCA..ETHIOPIC SYLLABLE CCO
+2DB0..2DB6 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE ZZA..ETHIOPIC SYLLABLE ZZO
+2DB8..2DBE ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE CCHA..ETHIOPIC SYLLABLE CCHO
+2DC0..2DC6 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE QYA..ETHIOPIC SYLLABLE QYO
+2DC8..2DCE ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE KYA..ETHIOPIC SYLLABLE KYO
+2DD0..2DD6 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE XYA..ETHIOPIC SYLLABLE XYO
+2DD8..2DDE ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE GYA..ETHIOPIC SYLLABLE GYO
+AB01..AB06 ; Ethiopic # Lo [6] ETHIOPIC SYLLABLE TTHU..ETHIOPIC SYLLABLE TTHO
+AB09..AB0E ; Ethiopic # Lo [6] ETHIOPIC SYLLABLE DDHU..ETHIOPIC SYLLABLE DDHO
+AB11..AB16 ; Ethiopic # Lo [6] ETHIOPIC SYLLABLE DZU..ETHIOPIC SYLLABLE DZO
+AB20..AB26 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE CCHHA..ETHIOPIC SYLLABLE CCHHO
+AB28..AB2E ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE BBA..ETHIOPIC SYLLABLE BBO
+1E7E0..1E7E6 ; Ethiopic # Lo [7] ETHIOPIC SYLLABLE HHYA..ETHIOPIC SYLLABLE HHYO
+1E7E8..1E7EB ; Ethiopic # Lo [4] ETHIOPIC SYLLABLE GURAGE HHWA..ETHIOPIC SYLLABLE HHWE
+1E7ED..1E7EE ; Ethiopic # Lo [2] ETHIOPIC SYLLABLE GURAGE MWI..ETHIOPIC SYLLABLE GURAGE MWEE
+1E7F0..1E7FE ; Ethiopic # Lo [15] ETHIOPIC SYLLABLE GURAGE QWI..ETHIOPIC SYLLABLE GURAGE PWEE
+
+# Total code points: 523
+
+# ================================================
+
+13A0..13F5 ; Cherokee # L& [86] CHEROKEE LETTER A..CHEROKEE LETTER MV
+13F8..13FD ; Cherokee # L& [6] CHEROKEE SMALL LETTER YE..CHEROKEE SMALL LETTER MV
+AB70..ABBF ; Cherokee # L& [80] CHEROKEE SMALL LETTER A..CHEROKEE SMALL LETTER YA
+
+# Total code points: 172
+
+# ================================================
+
+1400 ; Canadian_Aboriginal # Pd CANADIAN SYLLABICS HYPHEN
+1401..166C ; Canadian_Aboriginal # Lo [620] CANADIAN SYLLABICS E..CANADIAN SYLLABICS CARRIER TTSA
+166D ; Canadian_Aboriginal # So CANADIAN SYLLABICS CHI SIGN
+166E ; Canadian_Aboriginal # Po CANADIAN SYLLABICS FULL STOP
+166F..167F ; Canadian_Aboriginal # Lo [17] CANADIAN SYLLABICS QAI..CANADIAN SYLLABICS BLACKFOOT W
+18B0..18F5 ; Canadian_Aboriginal # Lo [70] CANADIAN SYLLABICS OY..CANADIAN SYLLABICS CARRIER DENTAL S
+11AB0..11ABF ; Canadian_Aboriginal # Lo [16] CANADIAN SYLLABICS NATTILIK HI..CANADIAN SYLLABICS SPA
+
+# Total code points: 726
+
+# ================================================
+
+1680 ; Ogham # Zs OGHAM SPACE MARK
+1681..169A ; Ogham # Lo [26] OGHAM LETTER BEITH..OGHAM LETTER PEITH
+169B ; Ogham # Ps OGHAM FEATHER MARK
+169C ; Ogham # Pe OGHAM REVERSED FEATHER MARK
+
+# Total code points: 29
+
+# ================================================
+
+16A0..16EA ; Runic # Lo [75] RUNIC LETTER FEHU FEOH FE F..RUNIC LETTER X
+16EE..16F0 ; Runic # Nl [3] RUNIC ARLAUG SYMBOL..RUNIC BELGTHOR SYMBOL
+16F1..16F8 ; Runic # Lo [8] RUNIC LETTER K..RUNIC LETTER FRANKS CASKET AESC
+
+# Total code points: 86
+
+# ================================================
+
+1780..17B3 ; Khmer # Lo [52] KHMER LETTER KA..KHMER INDEPENDENT VOWEL QAU
+17B4..17B5 ; Khmer # Mn [2] KHMER VOWEL INHERENT AQ..KHMER VOWEL INHERENT AA
+17B6 ; Khmer # Mc KHMER VOWEL SIGN AA
+17B7..17BD ; Khmer # Mn [7] KHMER VOWEL SIGN I..KHMER VOWEL SIGN UA
+17BE..17C5 ; Khmer # Mc [8] KHMER VOWEL SIGN OE..KHMER VOWEL SIGN AU
+17C6 ; Khmer # Mn KHMER SIGN NIKAHIT
+17C7..17C8 ; Khmer # Mc [2] KHMER SIGN REAHMUK..KHMER SIGN YUUKALEAPINTU
+17C9..17D3 ; Khmer # Mn [11] KHMER SIGN MUUSIKATOAN..KHMER SIGN BATHAMASAT
+17D4..17D6 ; Khmer # Po [3] KHMER SIGN KHAN..KHMER SIGN CAMNUC PII KUUH
+17D7 ; Khmer # Lm KHMER SIGN LEK TOO
+17D8..17DA ; Khmer # Po [3] KHMER SIGN BEYYAL..KHMER SIGN KOOMUUT
+17DB ; Khmer # Sc KHMER CURRENCY SYMBOL RIEL
+17DC ; Khmer # Lo KHMER SIGN AVAKRAHASANYA
+17DD ; Khmer # Mn KHMER SIGN ATTHACAN
+17E0..17E9 ; Khmer # Nd [10] KHMER DIGIT ZERO..KHMER DIGIT NINE
+17F0..17F9 ; Khmer # No [10] KHMER SYMBOL LEK ATTAK SON..KHMER SYMBOL LEK ATTAK PRAM-BUON
+19E0..19FF ; Khmer # So [32] KHMER SYMBOL PATHAMASAT..KHMER SYMBOL DAP-PRAM ROC
+
+# Total code points: 146
+
+# ================================================
+
+1800..1801 ; Mongolian # Po [2] MONGOLIAN BIRGA..MONGOLIAN ELLIPSIS
+1804 ; Mongolian # Po MONGOLIAN COLON
+1806 ; Mongolian # Pd MONGOLIAN TODO SOFT HYPHEN
+1807..180A ; Mongolian # Po [4] MONGOLIAN SIBE SYLLABLE BOUNDARY MARKER..MONGOLIAN NIRUGU
+180B..180D ; Mongolian # Mn [3] MONGOLIAN FREE VARIATION SELECTOR ONE..MONGOLIAN FREE VARIATION SELECTOR THREE
+180E ; Mongolian # Cf MONGOLIAN VOWEL SEPARATOR
+180F ; Mongolian # Mn MONGOLIAN FREE VARIATION SELECTOR FOUR
+1810..1819 ; Mongolian # Nd [10] MONGOLIAN DIGIT ZERO..MONGOLIAN DIGIT NINE
+1820..1842 ; Mongolian # Lo [35] MONGOLIAN LETTER A..MONGOLIAN LETTER CHI
+1843 ; Mongolian # Lm MONGOLIAN LETTER TODO LONG VOWEL SIGN
+1844..1878 ; Mongolian # Lo [53] MONGOLIAN LETTER TODO E..MONGOLIAN LETTER CHA WITH TWO DOTS
+1880..1884 ; Mongolian # Lo [5] MONGOLIAN LETTER ALI GALI ANUSVARA ONE..MONGOLIAN LETTER ALI GALI INVERTED UBADAMA
+1885..1886 ; Mongolian # Mn [2] MONGOLIAN LETTER ALI GALI BALUDA..MONGOLIAN LETTER ALI GALI THREE BALUDA
+1887..18A8 ; Mongolian # Lo [34] MONGOLIAN LETTER ALI GALI A..MONGOLIAN LETTER MANCHU ALI GALI BHA
+18A9 ; Mongolian # Mn MONGOLIAN LETTER ALI GALI DAGALGA
+18AA ; Mongolian # Lo MONGOLIAN LETTER MANCHU ALI GALI LHA
+11660..1166C ; Mongolian # Po [13] MONGOLIAN BIRGA WITH ORNAMENT..MONGOLIAN TURNED SWIRL BIRGA WITH DOUBLE ORNAMENT
+
+# Total code points: 168
+
+# ================================================
+
+3041..3096 ; Hiragana # Lo [86] HIRAGANA LETTER SMALL A..HIRAGANA LETTER SMALL KE
+309D..309E ; Hiragana # Lm [2] HIRAGANA ITERATION MARK..HIRAGANA VOICED ITERATION MARK
+309F ; Hiragana # Lo HIRAGANA DIGRAPH YORI
+1B001..1B11F ; Hiragana # Lo [287] HIRAGANA LETTER ARCHAIC YE..HIRAGANA LETTER ARCHAIC WU
+1B132 ; Hiragana # Lo HIRAGANA LETTER SMALL KO
+1B150..1B152 ; Hiragana # Lo [3] HIRAGANA LETTER SMALL WI..HIRAGANA LETTER SMALL WO
+1F200 ; Hiragana # So SQUARE HIRAGANA HOKA
+
+# Total code points: 381
+
+# ================================================
+
+30A1..30FA ; Katakana # Lo [90] KATAKANA LETTER SMALL A..KATAKANA LETTER VO
+30FD..30FE ; Katakana # Lm [2] KATAKANA ITERATION MARK..KATAKANA VOICED ITERATION MARK
+30FF ; Katakana # Lo KATAKANA DIGRAPH KOTO
+31F0..31FF ; Katakana # Lo [16] KATAKANA LETTER SMALL KU..KATAKANA LETTER SMALL RO
+32D0..32FE ; Katakana # So [47] CIRCLED KATAKANA A..CIRCLED KATAKANA WO
+3300..3357 ; Katakana # So [88] SQUARE APAATO..SQUARE WATTO
+FF66..FF6F ; Katakana # Lo [10] HALFWIDTH KATAKANA LETTER WO..HALFWIDTH KATAKANA LETTER SMALL TU
+FF71..FF9D ; Katakana # Lo [45] HALFWIDTH KATAKANA LETTER A..HALFWIDTH KATAKANA LETTER N
+1AFF0..1AFF3 ; Katakana # Lm [4] KATAKANA LETTER MINNAN TONE-2..KATAKANA LETTER MINNAN TONE-5
+1AFF5..1AFFB ; Katakana # Lm [7] KATAKANA LETTER MINNAN TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-5
+1AFFD..1AFFE ; Katakana # Lm [2] KATAKANA LETTER MINNAN NASALIZED TONE-7..KATAKANA LETTER MINNAN NASALIZED TONE-8
+1B000 ; Katakana # Lo KATAKANA LETTER ARCHAIC E
+1B120..1B122 ; Katakana # Lo [3] KATAKANA LETTER ARCHAIC YI..KATAKANA LETTER ARCHAIC WU
+1B155 ; Katakana # Lo KATAKANA LETTER SMALL KO
+1B164..1B167 ; Katakana # Lo [4] KATAKANA LETTER SMALL WI..KATAKANA LETTER SMALL N
+
+# Total code points: 321
+
+# ================================================
+
+02EA..02EB ; Bopomofo # Sk [2] MODIFIER LETTER YIN DEPARTING TONE MARK..MODIFIER LETTER YANG DEPARTING TONE MARK
+3105..312F ; Bopomofo # Lo [43] BOPOMOFO LETTER B..BOPOMOFO LETTER NN
+31A0..31BF ; Bopomofo # Lo [32] BOPOMOFO LETTER BU..BOPOMOFO LETTER AH
+
+# Total code points: 77
+
+# ================================================
+
+2E80..2E99 ; Han # So [26] CJK RADICAL REPEAT..CJK RADICAL RAP
+2E9B..2EF3 ; Han # So [89] CJK RADICAL CHOKE..CJK RADICAL C-SIMPLIFIED TURTLE
+2F00..2FD5 ; Han # So [214] KANGXI RADICAL ONE..KANGXI RADICAL FLUTE
+3005 ; Han # Lm IDEOGRAPHIC ITERATION MARK
+3007 ; Han # Nl IDEOGRAPHIC NUMBER ZERO
+3021..3029 ; Han # Nl [9] HANGZHOU NUMERAL ONE..HANGZHOU NUMERAL NINE
+3038..303A ; Han # Nl [3] HANGZHOU NUMERAL TEN..HANGZHOU NUMERAL THIRTY
+303B ; Han # Lm VERTICAL IDEOGRAPHIC ITERATION MARK
+3400..4DBF ; Han # Lo [6592] CJK UNIFIED IDEOGRAPH-3400..CJK UNIFIED IDEOGRAPH-4DBF
+4E00..9FFF ; Han # Lo [20992] CJK UNIFIED IDEOGRAPH-4E00..CJK UNIFIED IDEOGRAPH-9FFF
+F900..FA6D ; Han # Lo [366] CJK COMPATIBILITY IDEOGRAPH-F900..CJK COMPATIBILITY IDEOGRAPH-FA6D
+FA70..FAD9 ; Han # Lo [106] CJK COMPATIBILITY IDEOGRAPH-FA70..CJK COMPATIBILITY IDEOGRAPH-FAD9
+16FE2 ; Han # Po OLD CHINESE HOOK MARK
+16FE3 ; Han # Lm OLD CHINESE ITERATION MARK
+16FF0..16FF1 ; Han # Mc [2] VIETNAMESE ALTERNATE READING MARK CA..VIETNAMESE ALTERNATE READING MARK NHAY
+20000..2A6DF ; Han # Lo [42720] CJK UNIFIED IDEOGRAPH-20000..CJK UNIFIED IDEOGRAPH-2A6DF
+2A700..2B739 ; Han # Lo [4154] CJK UNIFIED IDEOGRAPH-2A700..CJK UNIFIED IDEOGRAPH-2B739
+2B740..2B81D ; Han # Lo [222] CJK UNIFIED IDEOGRAPH-2B740..CJK UNIFIED IDEOGRAPH-2B81D
+2B820..2CEA1 ; Han # Lo [5762] CJK UNIFIED IDEOGRAPH-2B820..CJK UNIFIED IDEOGRAPH-2CEA1
+2CEB0..2EBE0 ; Han # Lo [7473] CJK UNIFIED IDEOGRAPH-2CEB0..CJK UNIFIED IDEOGRAPH-2EBE0
+2EBF0..2EE5D ; Han # Lo [622] CJK UNIFIED IDEOGRAPH-2EBF0..CJK UNIFIED IDEOGRAPH-2EE5D
+2F800..2FA1D ; Han # Lo [542] CJK COMPATIBILITY IDEOGRAPH-2F800..CJK COMPATIBILITY IDEOGRAPH-2FA1D
+30000..3134A ; Han # Lo [4939] CJK UNIFIED IDEOGRAPH-30000..CJK UNIFIED IDEOGRAPH-3134A
+31350..323AF ; Han # Lo [4192] CJK UNIFIED IDEOGRAPH-31350..CJK UNIFIED IDEOGRAPH-323AF
+
+# Total code points: 99030
+
+# ================================================
+
+A000..A014 ; Yi # Lo [21] YI SYLLABLE IT..YI SYLLABLE E
+A015 ; Yi # Lm YI SYLLABLE WU
+A016..A48C ; Yi # Lo [1143] YI SYLLABLE BIT..YI SYLLABLE YYR
+A490..A4C6 ; Yi # So [55] YI RADICAL QOT..YI RADICAL KE
+
+# Total code points: 1220
+
+# ================================================
+
+10300..1031F ; Old_Italic # Lo [32] OLD ITALIC LETTER A..OLD ITALIC LETTER ESS
+10320..10323 ; Old_Italic # No [4] OLD ITALIC NUMERAL ONE..OLD ITALIC NUMERAL FIFTY
+1032D..1032F ; Old_Italic # Lo [3] OLD ITALIC LETTER YE..OLD ITALIC LETTER SOUTHERN TSE
+
+# Total code points: 39
+
+# ================================================
+
+10330..10340 ; Gothic # Lo [17] GOTHIC LETTER AHSA..GOTHIC LETTER PAIRTHRA
+10341 ; Gothic # Nl GOTHIC LETTER NINETY
+10342..10349 ; Gothic # Lo [8] GOTHIC LETTER RAIDA..GOTHIC LETTER OTHAL
+1034A ; Gothic # Nl GOTHIC LETTER NINE HUNDRED
+
+# Total code points: 27
+
+# ================================================
+
+10400..1044F ; Deseret # L& [80] DESERET CAPITAL LETTER LONG I..DESERET SMALL LETTER EW
+
+# Total code points: 80
+
+# ================================================
+
+0300..036F ; Inherited # Mn [112] COMBINING GRAVE ACCENT..COMBINING LATIN SMALL LETTER X
+0485..0486 ; Inherited # Mn [2] COMBINING CYRILLIC DASIA PNEUMATA..COMBINING CYRILLIC PSILI PNEUMATA
+064B..0655 ; Inherited # Mn [11] ARABIC FATHATAN..ARABIC HAMZA BELOW
+0670 ; Inherited # Mn ARABIC LETTER SUPERSCRIPT ALEF
+0951..0954 ; Inherited # Mn [4] DEVANAGARI STRESS SIGN UDATTA..DEVANAGARI ACUTE ACCENT
+1AB0..1ABD ; Inherited # Mn [14] COMBINING DOUBLED CIRCUMFLEX ACCENT..COMBINING PARENTHESES BELOW
+1ABE ; Inherited # Me COMBINING PARENTHESES OVERLAY
+1ABF..1ACE ; Inherited # Mn [16] COMBINING LATIN SMALL LETTER W BELOW..COMBINING LATIN SMALL LETTER INSULAR T
+1CD0..1CD2 ; Inherited # Mn [3] VEDIC TONE KARSHANA..VEDIC TONE PRENKHA
+1CD4..1CE0 ; Inherited # Mn [13] VEDIC SIGN YAJURVEDIC MIDLINE SVARITA..VEDIC TONE RIGVEDIC KASHMIRI INDEPENDENT SVARITA
+1CE2..1CE8 ; Inherited # Mn [7] VEDIC SIGN VISARGA SVARITA..VEDIC SIGN VISARGA ANUDATTA WITH TAIL
+1CED ; Inherited # Mn VEDIC SIGN TIRYAK
+1CF4 ; Inherited # Mn VEDIC TONE CANDRA ABOVE
+1CF8..1CF9 ; Inherited # Mn [2] VEDIC TONE RING ABOVE..VEDIC TONE DOUBLE RING ABOVE
+1DC0..1DFF ; Inherited # Mn [64] COMBINING DOTTED GRAVE ACCENT..COMBINING RIGHT ARROWHEAD AND DOWN ARROWHEAD BELOW
+200C..200D ; Inherited # Cf [2] ZERO WIDTH NON-JOINER..ZERO WIDTH JOINER
+20D0..20DC ; Inherited # Mn [13] COMBINING LEFT HARPOON ABOVE..COMBINING FOUR DOTS ABOVE
+20DD..20E0 ; Inherited # Me [4] COMBINING ENCLOSING CIRCLE..COMBINING ENCLOSING CIRCLE BACKSLASH
+20E1 ; Inherited # Mn COMBINING LEFT RIGHT ARROW ABOVE
+20E2..20E4 ; Inherited # Me [3] COMBINING ENCLOSING SCREEN..COMBINING ENCLOSING UPWARD POINTING TRIANGLE
+20E5..20F0 ; Inherited # Mn [12] COMBINING REVERSE SOLIDUS OVERLAY..COMBINING ASTERISK ABOVE
+302A..302D ; Inherited # Mn [4] IDEOGRAPHIC LEVEL TONE MARK..IDEOGRAPHIC ENTERING TONE MARK
+3099..309A ; Inherited # Mn [2] COMBINING KATAKANA-HIRAGANA VOICED SOUND MARK..COMBINING KATAKANA-HIRAGANA SEMI-VOICED SOUND MARK
+FE00..FE0F ; Inherited # Mn [16] VARIATION SELECTOR-1..VARIATION SELECTOR-16
+FE20..FE2D ; Inherited # Mn [14] COMBINING LIGATURE LEFT HALF..COMBINING CONJOINING MACRON BELOW
+101FD ; Inherited # Mn PHAISTOS DISC SIGN COMBINING OBLIQUE STROKE
+102E0 ; Inherited # Mn COPTIC EPACT THOUSANDS MARK
+1133B ; Inherited # Mn COMBINING BINDU BELOW
+1CF00..1CF2D ; Inherited # Mn [46] ZNAMENNY COMBINING MARK GORAZDO NIZKO S KRYZHEM ON LEFT..ZNAMENNY COMBINING MARK KRYZH ON LEFT
+1CF30..1CF46 ; Inherited # Mn [23] ZNAMENNY COMBINING TONAL RANGE MARK MRACHNO..ZNAMENNY PRIZNAK MODIFIER ROG
+1D167..1D169 ; Inherited # Mn [3] MUSICAL SYMBOL COMBINING TREMOLO-1..MUSICAL SYMBOL COMBINING TREMOLO-3
+1D17B..1D182 ; Inherited # Mn [8] MUSICAL SYMBOL COMBINING ACCENT..MUSICAL SYMBOL COMBINING LOURE
+1D185..1D18B ; Inherited # Mn [7] MUSICAL SYMBOL COMBINING DOIT..MUSICAL SYMBOL COMBINING TRIPLE TONGUE
+1D1AA..1D1AD ; Inherited # Mn [4] MUSICAL SYMBOL COMBINING DOWN BOW..MUSICAL SYMBOL COMBINING SNAP PIZZICATO
+E0100..E01EF ; Inherited # Mn [240] VARIATION SELECTOR-17..VARIATION SELECTOR-256
+
+# Total code points: 657
+
+# ================================================
+
+1700..1711 ; Tagalog # Lo [18] TAGALOG LETTER A..TAGALOG LETTER HA
+1712..1714 ; Tagalog # Mn [3] TAGALOG VOWEL SIGN I..TAGALOG SIGN VIRAMA
+1715 ; Tagalog # Mc TAGALOG SIGN PAMUDPOD
+171F ; Tagalog # Lo TAGALOG LETTER ARCHAIC RA
+
+# Total code points: 23
+
+# ================================================
+
+1720..1731 ; Hanunoo # Lo [18] HANUNOO LETTER A..HANUNOO LETTER HA
+1732..1733 ; Hanunoo # Mn [2] HANUNOO VOWEL SIGN I..HANUNOO VOWEL SIGN U
+1734 ; Hanunoo # Mc HANUNOO SIGN PAMUDPOD
+
+# Total code points: 21
+
+# ================================================
+
+1740..1751 ; Buhid # Lo [18] BUHID LETTER A..BUHID LETTER HA
+1752..1753 ; Buhid # Mn [2] BUHID VOWEL SIGN I..BUHID VOWEL SIGN U
+
+# Total code points: 20
+
+# ================================================
+
+1760..176C ; Tagbanwa # Lo [13] TAGBANWA LETTER A..TAGBANWA LETTER YA
+176E..1770 ; Tagbanwa # Lo [3] TAGBANWA LETTER LA..TAGBANWA LETTER SA
+1772..1773 ; Tagbanwa # Mn [2] TAGBANWA VOWEL SIGN I..TAGBANWA VOWEL SIGN U
+
+# Total code points: 18
+
+# ================================================
+
+1900..191E ; Limbu # Lo [31] LIMBU VOWEL-CARRIER LETTER..LIMBU LETTER TRA
+1920..1922 ; Limbu # Mn [3] LIMBU VOWEL SIGN A..LIMBU VOWEL SIGN U
+1923..1926 ; Limbu # Mc [4] LIMBU VOWEL SIGN EE..LIMBU VOWEL SIGN AU
+1927..1928 ; Limbu # Mn [2] LIMBU VOWEL SIGN E..LIMBU VOWEL SIGN O
+1929..192B ; Limbu # Mc [3] LIMBU SUBJOINED LETTER YA..LIMBU SUBJOINED LETTER WA
+1930..1931 ; Limbu # Mc [2] LIMBU SMALL LETTER KA..LIMBU SMALL LETTER NGA
+1932 ; Limbu # Mn LIMBU SMALL LETTER ANUSVARA
+1933..1938 ; Limbu # Mc [6] LIMBU SMALL LETTER TA..LIMBU SMALL LETTER LA
+1939..193B ; Limbu # Mn [3] LIMBU SIGN MUKPHRENG..LIMBU SIGN SA-I
+1940 ; Limbu # So LIMBU SIGN LOO
+1944..1945 ; Limbu # Po [2] LIMBU EXCLAMATION MARK..LIMBU QUESTION MARK
+1946..194F ; Limbu # Nd [10] LIMBU DIGIT ZERO..LIMBU DIGIT NINE
+
+# Total code points: 68
+
+# ================================================
+
+1950..196D ; Tai_Le # Lo [30] TAI LE LETTER KA..TAI LE LETTER AI
+1970..1974 ; Tai_Le # Lo [5] TAI LE LETTER TONE-2..TAI LE LETTER TONE-6
+
+# Total code points: 35
+
+# ================================================
+
+10000..1000B ; Linear_B # Lo [12] LINEAR B SYLLABLE B008 A..LINEAR B SYLLABLE B046 JE
+1000D..10026 ; Linear_B # Lo [26] LINEAR B SYLLABLE B036 JO..LINEAR B SYLLABLE B032 QO
+10028..1003A ; Linear_B # Lo [19] LINEAR B SYLLABLE B060 RA..LINEAR B SYLLABLE B042 WO
+1003C..1003D ; Linear_B # Lo [2] LINEAR B SYLLABLE B017 ZA..LINEAR B SYLLABLE B074 ZE
+1003F..1004D ; Linear_B # Lo [15] LINEAR B SYLLABLE B020 ZO..LINEAR B SYLLABLE B091 TWO
+10050..1005D ; Linear_B # Lo [14] LINEAR B SYMBOL B018..LINEAR B SYMBOL B089
+10080..100FA ; Linear_B # Lo [123] LINEAR B IDEOGRAM B100 MAN..LINEAR B IDEOGRAM VESSEL B305
+
+# Total code points: 211
+
+# ================================================
+
+10380..1039D ; Ugaritic # Lo [30] UGARITIC LETTER ALPA..UGARITIC LETTER SSU
+1039F ; Ugaritic # Po UGARITIC WORD DIVIDER
+
+# Total code points: 31
+
+# ================================================
+
+10450..1047F ; Shavian # Lo [48] SHAVIAN LETTER PEEP..SHAVIAN LETTER YEW
+
+# Total code points: 48
+
+# ================================================
+
+10480..1049D ; Osmanya # Lo [30] OSMANYA LETTER ALEF..OSMANYA LETTER OO
+104A0..104A9 ; Osmanya # Nd [10] OSMANYA DIGIT ZERO..OSMANYA DIGIT NINE
+
+# Total code points: 40
+
+# ================================================
+
+10800..10805 ; Cypriot # Lo [6] CYPRIOT SYLLABLE A..CYPRIOT SYLLABLE JA
+10808 ; Cypriot # Lo CYPRIOT SYLLABLE JO
+1080A..10835 ; Cypriot # Lo [44] CYPRIOT SYLLABLE KA..CYPRIOT SYLLABLE WO
+10837..10838 ; Cypriot # Lo [2] CYPRIOT SYLLABLE XA..CYPRIOT SYLLABLE XE
+1083C ; Cypriot # Lo CYPRIOT SYLLABLE ZA
+1083F ; Cypriot # Lo CYPRIOT SYLLABLE ZO
+
+# Total code points: 55
+
+# ================================================
+
+2800..28FF ; Braille # So [256] BRAILLE PATTERN BLANK..BRAILLE PATTERN DOTS-12345678
+
+# Total code points: 256
+
+# ================================================
+
+1A00..1A16 ; Buginese # Lo [23] BUGINESE LETTER KA..BUGINESE LETTER HA
+1A17..1A18 ; Buginese # Mn [2] BUGINESE VOWEL SIGN I..BUGINESE VOWEL SIGN U
+1A19..1A1A ; Buginese # Mc [2] BUGINESE VOWEL SIGN E..BUGINESE VOWEL SIGN O
+1A1B ; Buginese # Mn BUGINESE VOWEL SIGN AE
+1A1E..1A1F ; Buginese # Po [2] BUGINESE PALLAWA..BUGINESE END OF SECTION
+
+# Total code points: 30
+
+# ================================================
+
+03E2..03EF ; Coptic # L& [14] COPTIC CAPITAL LETTER SHEI..COPTIC SMALL LETTER DEI
+2C80..2CE4 ; Coptic # L& [101] COPTIC CAPITAL LETTER ALFA..COPTIC SYMBOL KAI
+2CE5..2CEA ; Coptic # So [6] COPTIC SYMBOL MI RO..COPTIC SYMBOL SHIMA SIMA
+2CEB..2CEE ; Coptic # L& [4] COPTIC CAPITAL LETTER CRYPTOGRAMMIC SHEI..COPTIC SMALL LETTER CRYPTOGRAMMIC GANGIA
+2CEF..2CF1 ; Coptic # Mn [3] COPTIC COMBINING NI ABOVE..COPTIC COMBINING SPIRITUS LENIS
+2CF2..2CF3 ; Coptic # L& [2] COPTIC CAPITAL LETTER BOHAIRIC KHEI..COPTIC SMALL LETTER BOHAIRIC KHEI
+2CF9..2CFC ; Coptic # Po [4] COPTIC OLD NUBIAN FULL STOP..COPTIC OLD NUBIAN VERSE DIVIDER
+2CFD ; Coptic # No COPTIC FRACTION ONE HALF
+2CFE..2CFF ; Coptic # Po [2] COPTIC FULL STOP..COPTIC MORPHOLOGICAL DIVIDER
+
+# Total code points: 137
+
+# ================================================
+
+1980..19AB ; New_Tai_Lue # Lo [44] NEW TAI LUE LETTER HIGH QA..NEW TAI LUE LETTER LOW SUA
+19B0..19C9 ; New_Tai_Lue # Lo [26] NEW TAI LUE VOWEL SIGN VOWEL SHORTENER..NEW TAI LUE TONE MARK-2
+19D0..19D9 ; New_Tai_Lue # Nd [10] NEW TAI LUE DIGIT ZERO..NEW TAI LUE DIGIT NINE
+19DA ; New_Tai_Lue # No NEW TAI LUE THAM DIGIT ONE
+19DE..19DF ; New_Tai_Lue # So [2] NEW TAI LUE SIGN LAE..NEW TAI LUE SIGN LAEV
+
+# Total code points: 83
+
+# ================================================
+
+2C00..2C5F ; Glagolitic # L& [96] GLAGOLITIC CAPITAL LETTER AZU..GLAGOLITIC SMALL LETTER CAUDATE CHRIVI
+1E000..1E006 ; Glagolitic # Mn [7] COMBINING GLAGOLITIC LETTER AZU..COMBINING GLAGOLITIC LETTER ZHIVETE
+1E008..1E018 ; Glagolitic # Mn [17] COMBINING GLAGOLITIC LETTER ZEMLJA..COMBINING GLAGOLITIC LETTER HERU
+1E01B..1E021 ; Glagolitic # Mn [7] COMBINING GLAGOLITIC LETTER SHTA..COMBINING GLAGOLITIC LETTER YATI
+1E023..1E024 ; Glagolitic # Mn [2] COMBINING GLAGOLITIC LETTER YU..COMBINING GLAGOLITIC LETTER SMALL YUS
+1E026..1E02A ; Glagolitic # Mn [5] COMBINING GLAGOLITIC LETTER YO..COMBINING GLAGOLITIC LETTER FITA
+
+# Total code points: 134
+
+# ================================================
+
+2D30..2D67 ; Tifinagh # Lo [56] TIFINAGH LETTER YA..TIFINAGH LETTER YO
+2D6F ; Tifinagh # Lm TIFINAGH MODIFIER LETTER LABIALIZATION MARK
+2D70 ; Tifinagh # Po TIFINAGH SEPARATOR MARK
+2D7F ; Tifinagh # Mn TIFINAGH CONSONANT JOINER
+
+# Total code points: 59
+
+# ================================================
+
+A800..A801 ; Syloti_Nagri # Lo [2] SYLOTI NAGRI LETTER A..SYLOTI NAGRI LETTER I
+A802 ; Syloti_Nagri # Mn SYLOTI NAGRI SIGN DVISVARA
+A803..A805 ; Syloti_Nagri # Lo [3] SYLOTI NAGRI LETTER U..SYLOTI NAGRI LETTER O
+A806 ; Syloti_Nagri # Mn SYLOTI NAGRI SIGN HASANTA
+A807..A80A ; Syloti_Nagri # Lo [4] SYLOTI NAGRI LETTER KO..SYLOTI NAGRI LETTER GHO
+A80B ; Syloti_Nagri # Mn SYLOTI NAGRI SIGN ANUSVARA
+A80C..A822 ; Syloti_Nagri # Lo [23] SYLOTI NAGRI LETTER CO..SYLOTI NAGRI LETTER HO
+A823..A824 ; Syloti_Nagri # Mc [2] SYLOTI NAGRI VOWEL SIGN A..SYLOTI NAGRI VOWEL SIGN I
+A825..A826 ; Syloti_Nagri # Mn [2] SYLOTI NAGRI VOWEL SIGN U..SYLOTI NAGRI VOWEL SIGN E
+A827 ; Syloti_Nagri # Mc SYLOTI NAGRI VOWEL SIGN OO
+A828..A82B ; Syloti_Nagri # So [4] SYLOTI NAGRI POETRY MARK-1..SYLOTI NAGRI POETRY MARK-4
+A82C ; Syloti_Nagri # Mn SYLOTI NAGRI SIGN ALTERNATE HASANTA
+
+# Total code points: 45
+
+# ================================================
+
+103A0..103C3 ; Old_Persian # Lo [36] OLD PERSIAN SIGN A..OLD PERSIAN SIGN HA
+103C8..103CF ; Old_Persian # Lo [8] OLD PERSIAN SIGN AURAMAZDAA..OLD PERSIAN SIGN BUUMISH
+103D0 ; Old_Persian # Po OLD PERSIAN WORD DIVIDER
+103D1..103D5 ; Old_Persian # Nl [5] OLD PERSIAN NUMBER ONE..OLD PERSIAN NUMBER HUNDRED
+
+# Total code points: 50
+
+# ================================================
+
+10A00 ; Kharoshthi # Lo KHAROSHTHI LETTER A
+10A01..10A03 ; Kharoshthi # Mn [3] KHAROSHTHI VOWEL SIGN I..KHAROSHTHI VOWEL SIGN VOCALIC R
+10A05..10A06 ; Kharoshthi # Mn [2] KHAROSHTHI VOWEL SIGN E..KHAROSHTHI VOWEL SIGN O
+10A0C..10A0F ; Kharoshthi # Mn [4] KHAROSHTHI VOWEL LENGTH MARK..KHAROSHTHI SIGN VISARGA
+10A10..10A13 ; Kharoshthi # Lo [4] KHAROSHTHI LETTER KA..KHAROSHTHI LETTER GHA
+10A15..10A17 ; Kharoshthi # Lo [3] KHAROSHTHI LETTER CA..KHAROSHTHI LETTER JA
+10A19..10A35 ; Kharoshthi # Lo [29] KHAROSHTHI LETTER NYA..KHAROSHTHI LETTER VHA
+10A38..10A3A ; Kharoshthi # Mn [3] KHAROSHTHI SIGN BAR ABOVE..KHAROSHTHI SIGN DOT BELOW
+10A3F ; Kharoshthi # Mn KHAROSHTHI VIRAMA
+10A40..10A48 ; Kharoshthi # No [9] KHAROSHTHI DIGIT ONE..KHAROSHTHI FRACTION ONE HALF
+10A50..10A58 ; Kharoshthi # Po [9] KHAROSHTHI PUNCTUATION DOT..KHAROSHTHI PUNCTUATION LINES
+
+# Total code points: 68
+
+# ================================================
+
+1B00..1B03 ; Balinese # Mn [4] BALINESE SIGN ULU RICEM..BALINESE SIGN SURANG
+1B04 ; Balinese # Mc BALINESE SIGN BISAH
+1B05..1B33 ; Balinese # Lo [47] BALINESE LETTER AKARA..BALINESE LETTER HA
+1B34 ; Balinese # Mn BALINESE SIGN REREKAN
+1B35 ; Balinese # Mc BALINESE VOWEL SIGN TEDUNG
+1B36..1B3A ; Balinese # Mn [5] BALINESE VOWEL SIGN ULU..BALINESE VOWEL SIGN RA REPA
+1B3B ; Balinese # Mc BALINESE VOWEL SIGN RA REPA TEDUNG
+1B3C ; Balinese # Mn BALINESE VOWEL SIGN LA LENGA
+1B3D..1B41 ; Balinese # Mc [5] BALINESE VOWEL SIGN LA LENGA TEDUNG..BALINESE VOWEL SIGN TALING REPA TEDUNG
+1B42 ; Balinese # Mn BALINESE VOWEL SIGN PEPET
+1B43..1B44 ; Balinese # Mc [2] BALINESE VOWEL SIGN PEPET TEDUNG..BALINESE ADEG ADEG
+1B45..1B4C ; Balinese # Lo [8] BALINESE LETTER KAF SASAK..BALINESE LETTER ARCHAIC JNYA
+1B50..1B59 ; Balinese # Nd [10] BALINESE DIGIT ZERO..BALINESE DIGIT NINE
+1B5A..1B60 ; Balinese # Po [7] BALINESE PANTI..BALINESE PAMENENG
+1B61..1B6A ; Balinese # So [10] BALINESE MUSICAL SYMBOL DONG..BALINESE MUSICAL SYMBOL DANG GEDE
+1B6B..1B73 ; Balinese # Mn [9] BALINESE MUSICAL SYMBOL COMBINING TEGEH..BALINESE MUSICAL SYMBOL COMBINING GONG
+1B74..1B7C ; Balinese # So [9] BALINESE MUSICAL SYMBOL RIGHT-HAND OPEN DUG..BALINESE MUSICAL SYMBOL LEFT-HAND OPEN PING
+1B7D..1B7E ; Balinese # Po [2] BALINESE PANTI LANTANG..BALINESE PAMADA LANTANG
+
+# Total code points: 124
+
+# ================================================
+
+12000..12399 ; Cuneiform # Lo [922] CUNEIFORM SIGN A..CUNEIFORM SIGN U U
+12400..1246E ; Cuneiform # Nl [111] CUNEIFORM NUMERIC SIGN TWO ASH..CUNEIFORM NUMERIC SIGN NINE U VARIANT FORM
+12470..12474 ; Cuneiform # Po [5] CUNEIFORM PUNCTUATION SIGN OLD ASSYRIAN WORD DIVIDER..CUNEIFORM PUNCTUATION SIGN DIAGONAL QUADCOLON
+12480..12543 ; Cuneiform # Lo [196] CUNEIFORM SIGN AB TIMES NUN TENU..CUNEIFORM SIGN ZU5 TIMES THREE DISH TENU
+
+# Total code points: 1234
+
+# ================================================
+
+10900..10915 ; Phoenician # Lo [22] PHOENICIAN LETTER ALF..PHOENICIAN LETTER TAU
+10916..1091B ; Phoenician # No [6] PHOENICIAN NUMBER ONE..PHOENICIAN NUMBER THREE
+1091F ; Phoenician # Po PHOENICIAN WORD SEPARATOR
+
+# Total code points: 29
+
+# ================================================
+
+A840..A873 ; Phags_Pa # Lo [52] PHAGS-PA LETTER KA..PHAGS-PA LETTER CANDRABINDU
+A874..A877 ; Phags_Pa # Po [4] PHAGS-PA SINGLE HEAD MARK..PHAGS-PA MARK DOUBLE SHAD
+
+# Total code points: 56
+
+# ================================================
+
+07C0..07C9 ; Nko # Nd [10] NKO DIGIT ZERO..NKO DIGIT NINE
+07CA..07EA ; Nko # Lo [33] NKO LETTER A..NKO LETTER JONA RA
+07EB..07F3 ; Nko # Mn [9] NKO COMBINING SHORT HIGH TONE..NKO COMBINING DOUBLE DOT ABOVE
+07F4..07F5 ; Nko # Lm [2] NKO HIGH TONE APOSTROPHE..NKO LOW TONE APOSTROPHE
+07F6 ; Nko # So NKO SYMBOL OO DENNEN
+07F7..07F9 ; Nko # Po [3] NKO SYMBOL GBAKURUNEN..NKO EXCLAMATION MARK
+07FA ; Nko # Lm NKO LAJANYALAN
+07FD ; Nko # Mn NKO DANTAYALAN
+07FE..07FF ; Nko # Sc [2] NKO DOROME SIGN..NKO TAMAN SIGN
+
+# Total code points: 62
+
+# ================================================
+
+1B80..1B81 ; Sundanese # Mn [2] SUNDANESE SIGN PANYECEK..SUNDANESE SIGN PANGLAYAR
+1B82 ; Sundanese # Mc SUNDANESE SIGN PANGWISAD
+1B83..1BA0 ; Sundanese # Lo [30] SUNDANESE LETTER A..SUNDANESE LETTER HA
+1BA1 ; Sundanese # Mc SUNDANESE CONSONANT SIGN PAMINGKAL
+1BA2..1BA5 ; Sundanese # Mn [4] SUNDANESE CONSONANT SIGN PANYAKRA..SUNDANESE VOWEL SIGN PANYUKU
+1BA6..1BA7 ; Sundanese # Mc [2] SUNDANESE VOWEL SIGN PANAELAENG..SUNDANESE VOWEL SIGN PANOLONG
+1BA8..1BA9 ; Sundanese # Mn [2] SUNDANESE VOWEL SIGN PAMEPET..SUNDANESE VOWEL SIGN PANEULEUNG
+1BAA ; Sundanese # Mc SUNDANESE SIGN PAMAAEH
+1BAB..1BAD ; Sundanese # Mn [3] SUNDANESE SIGN VIRAMA..SUNDANESE CONSONANT SIGN PASANGAN WA
+1BAE..1BAF ; Sundanese # Lo [2] SUNDANESE LETTER KHA..SUNDANESE LETTER SYA
+1BB0..1BB9 ; Sundanese # Nd [10] SUNDANESE DIGIT ZERO..SUNDANESE DIGIT NINE
+1BBA..1BBF ; Sundanese # Lo [6] SUNDANESE AVAGRAHA..SUNDANESE LETTER FINAL M
+1CC0..1CC7 ; Sundanese # Po [8] SUNDANESE PUNCTUATION BINDU SURYA..SUNDANESE PUNCTUATION BINDU BA SATANGA
+
+# Total code points: 72
+
+# ================================================
+
+1C00..1C23 ; Lepcha # Lo [36] LEPCHA LETTER KA..LEPCHA LETTER A
+1C24..1C2B ; Lepcha # Mc [8] LEPCHA SUBJOINED LETTER YA..LEPCHA VOWEL SIGN UU
+1C2C..1C33 ; Lepcha # Mn [8] LEPCHA VOWEL SIGN E..LEPCHA CONSONANT SIGN T
+1C34..1C35 ; Lepcha # Mc [2] LEPCHA CONSONANT SIGN NYIN-DO..LEPCHA CONSONANT SIGN KANG
+1C36..1C37 ; Lepcha # Mn [2] LEPCHA SIGN RAN..LEPCHA SIGN NUKTA
+1C3B..1C3F ; Lepcha # Po [5] LEPCHA PUNCTUATION TA-ROL..LEPCHA PUNCTUATION TSHOOK
+1C40..1C49 ; Lepcha # Nd [10] LEPCHA DIGIT ZERO..LEPCHA DIGIT NINE
+1C4D..1C4F ; Lepcha # Lo [3] LEPCHA LETTER TTA..LEPCHA LETTER DDA
+
+# Total code points: 74
+
+# ================================================
+
+1C50..1C59 ; Ol_Chiki # Nd [10] OL CHIKI DIGIT ZERO..OL CHIKI DIGIT NINE
+1C5A..1C77 ; Ol_Chiki # Lo [30] OL CHIKI LETTER LA..OL CHIKI LETTER OH
+1C78..1C7D ; Ol_Chiki # Lm [6] OL CHIKI MU TTUDDAG..OL CHIKI AHAD
+1C7E..1C7F ; Ol_Chiki # Po [2] OL CHIKI PUNCTUATION MUCAAD..OL CHIKI PUNCTUATION DOUBLE MUCAAD
+
+# Total code points: 48
+
+# ================================================
+
+A500..A60B ; Vai # Lo [268] VAI SYLLABLE EE..VAI SYLLABLE NG
+A60C ; Vai # Lm VAI SYLLABLE LENGTHENER
+A60D..A60F ; Vai # Po [3] VAI COMMA..VAI QUESTION MARK
+A610..A61F ; Vai # Lo [16] VAI SYLLABLE NDOLE FA..VAI SYMBOL JONG
+A620..A629 ; Vai # Nd [10] VAI DIGIT ZERO..VAI DIGIT NINE
+A62A..A62B ; Vai # Lo [2] VAI SYLLABLE NDOLE MA..VAI SYLLABLE NDOLE DO
+
+# Total code points: 300
+
+# ================================================
+
+A880..A881 ; Saurashtra # Mc [2] SAURASHTRA SIGN ANUSVARA..SAURASHTRA SIGN VISARGA
+A882..A8B3 ; Saurashtra # Lo [50] SAURASHTRA LETTER A..SAURASHTRA LETTER LLA
+A8B4..A8C3 ; Saurashtra # Mc [16] SAURASHTRA CONSONANT SIGN HAARU..SAURASHTRA VOWEL SIGN AU
+A8C4..A8C5 ; Saurashtra # Mn [2] SAURASHTRA SIGN VIRAMA..SAURASHTRA SIGN CANDRABINDU
+A8CE..A8CF ; Saurashtra # Po [2] SAURASHTRA DANDA..SAURASHTRA DOUBLE DANDA
+A8D0..A8D9 ; Saurashtra # Nd [10] SAURASHTRA DIGIT ZERO..SAURASHTRA DIGIT NINE
+
+# Total code points: 82
+
+# ================================================
+
+A900..A909 ; Kayah_Li # Nd [10] KAYAH LI DIGIT ZERO..KAYAH LI DIGIT NINE
+A90A..A925 ; Kayah_Li # Lo [28] KAYAH LI LETTER KA..KAYAH LI LETTER OO
+A926..A92D ; Kayah_Li # Mn [8] KAYAH LI VOWEL UE..KAYAH LI TONE CALYA PLOPHU
+A92F ; Kayah_Li # Po KAYAH LI SIGN SHYA
+
+# Total code points: 47
+
+# ================================================
+
+A930..A946 ; Rejang # Lo [23] REJANG LETTER KA..REJANG LETTER A
+A947..A951 ; Rejang # Mn [11] REJANG VOWEL SIGN I..REJANG CONSONANT SIGN R
+A952..A953 ; Rejang # Mc [2] REJANG CONSONANT SIGN H..REJANG VIRAMA
+A95F ; Rejang # Po REJANG SECTION MARK
+
+# Total code points: 37
+
+# ================================================
+
+10280..1029C ; Lycian # Lo [29] LYCIAN LETTER A..LYCIAN LETTER X
+
+# Total code points: 29
+
+# ================================================
+
+102A0..102D0 ; Carian # Lo [49] CARIAN LETTER A..CARIAN LETTER UUU3
+
+# Total code points: 49
+
+# ================================================
+
+10920..10939 ; Lydian # Lo [26] LYDIAN LETTER A..LYDIAN LETTER C
+1093F ; Lydian # Po LYDIAN TRIANGULAR MARK
+
+# Total code points: 27
+
+# ================================================
+
+AA00..AA28 ; Cham # Lo [41] CHAM LETTER A..CHAM LETTER HA
+AA29..AA2E ; Cham # Mn [6] CHAM VOWEL SIGN AA..CHAM VOWEL SIGN OE
+AA2F..AA30 ; Cham # Mc [2] CHAM VOWEL SIGN O..CHAM VOWEL SIGN AI
+AA31..AA32 ; Cham # Mn [2] CHAM VOWEL SIGN AU..CHAM VOWEL SIGN UE
+AA33..AA34 ; Cham # Mc [2] CHAM CONSONANT SIGN YA..CHAM CONSONANT SIGN RA
+AA35..AA36 ; Cham # Mn [2] CHAM CONSONANT SIGN LA..CHAM CONSONANT SIGN WA
+AA40..AA42 ; Cham # Lo [3] CHAM LETTER FINAL K..CHAM LETTER FINAL NG
+AA43 ; Cham # Mn CHAM CONSONANT SIGN FINAL NG
+AA44..AA4B ; Cham # Lo [8] CHAM LETTER FINAL CH..CHAM LETTER FINAL SS
+AA4C ; Cham # Mn CHAM CONSONANT SIGN FINAL M
+AA4D ; Cham # Mc CHAM CONSONANT SIGN FINAL H
+AA50..AA59 ; Cham # Nd [10] CHAM DIGIT ZERO..CHAM DIGIT NINE
+AA5C..AA5F ; Cham # Po [4] CHAM PUNCTUATION SPIRAL..CHAM PUNCTUATION TRIPLE DANDA
+
+# Total code points: 83
+
+# ================================================
+
+1A20..1A54 ; Tai_Tham # Lo [53] TAI THAM LETTER HIGH KA..TAI THAM LETTER GREAT SA
+1A55 ; Tai_Tham # Mc TAI THAM CONSONANT SIGN MEDIAL RA
+1A56 ; Tai_Tham # Mn TAI THAM CONSONANT SIGN MEDIAL LA
+1A57 ; Tai_Tham # Mc TAI THAM CONSONANT SIGN LA TANG LAI
+1A58..1A5E ; Tai_Tham # Mn [7] TAI THAM SIGN MAI KANG LAI..TAI THAM CONSONANT SIGN SA
+1A60 ; Tai_Tham # Mn TAI THAM SIGN SAKOT
+1A61 ; Tai_Tham # Mc TAI THAM VOWEL SIGN A
+1A62 ; Tai_Tham # Mn TAI THAM VOWEL SIGN MAI SAT
+1A63..1A64 ; Tai_Tham # Mc [2] TAI THAM VOWEL SIGN AA..TAI THAM VOWEL SIGN TALL AA
+1A65..1A6C ; Tai_Tham # Mn [8] TAI THAM VOWEL SIGN I..TAI THAM VOWEL SIGN OA BELOW
+1A6D..1A72 ; Tai_Tham # Mc [6] TAI THAM VOWEL SIGN OY..TAI THAM VOWEL SIGN THAM AI
+1A73..1A7C ; Tai_Tham # Mn [10] TAI THAM VOWEL SIGN OA ABOVE..TAI THAM SIGN KHUEN-LUE KARAN
+1A7F ; Tai_Tham # Mn TAI THAM COMBINING CRYPTOGRAMMIC DOT
+1A80..1A89 ; Tai_Tham # Nd [10] TAI THAM HORA DIGIT ZERO..TAI THAM HORA DIGIT NINE
+1A90..1A99 ; Tai_Tham # Nd [10] TAI THAM THAM DIGIT ZERO..TAI THAM THAM DIGIT NINE
+1AA0..1AA6 ; Tai_Tham # Po [7] TAI THAM SIGN WIANG..TAI THAM SIGN REVERSED ROTATED RANA
+1AA7 ; Tai_Tham # Lm TAI THAM SIGN MAI YAMOK
+1AA8..1AAD ; Tai_Tham # Po [6] TAI THAM SIGN KAAN..TAI THAM SIGN CAANG
+
+# Total code points: 127
+
+# ================================================
+
+AA80..AAAF ; Tai_Viet # Lo [48] TAI VIET LETTER LOW KO..TAI VIET LETTER HIGH O
+AAB0 ; Tai_Viet # Mn TAI VIET MAI KANG
+AAB1 ; Tai_Viet # Lo TAI VIET VOWEL AA
+AAB2..AAB4 ; Tai_Viet # Mn [3] TAI VIET VOWEL I..TAI VIET VOWEL U
+AAB5..AAB6 ; Tai_Viet # Lo [2] TAI VIET VOWEL E..TAI VIET VOWEL O
+AAB7..AAB8 ; Tai_Viet # Mn [2] TAI VIET MAI KHIT..TAI VIET VOWEL IA
+AAB9..AABD ; Tai_Viet # Lo [5] TAI VIET VOWEL UEA..TAI VIET VOWEL AN
+AABE..AABF ; Tai_Viet # Mn [2] TAI VIET VOWEL AM..TAI VIET TONE MAI EK
+AAC0 ; Tai_Viet # Lo TAI VIET TONE MAI NUENG
+AAC1 ; Tai_Viet # Mn TAI VIET TONE MAI THO
+AAC2 ; Tai_Viet # Lo TAI VIET TONE MAI SONG
+AADB..AADC ; Tai_Viet # Lo [2] TAI VIET SYMBOL KON..TAI VIET SYMBOL NUENG
+AADD ; Tai_Viet # Lm TAI VIET SYMBOL SAM
+AADE..AADF ; Tai_Viet # Po [2] TAI VIET SYMBOL HO HOI..TAI VIET SYMBOL KOI KOI
+
+# Total code points: 72
+
+# ================================================
+
+10B00..10B35 ; Avestan # Lo [54] AVESTAN LETTER A..AVESTAN LETTER HE
+10B39..10B3F ; Avestan # Po [7] AVESTAN ABBREVIATION MARK..LARGE ONE RING OVER TWO RINGS PUNCTUATION
+
+# Total code points: 61
+
+# ================================================
+
+13000..1342F ; Egyptian_Hieroglyphs # Lo [1072] EGYPTIAN HIEROGLYPH A001..EGYPTIAN HIEROGLYPH V011D
+13430..1343F ; Egyptian_Hieroglyphs # Cf [16] EGYPTIAN HIEROGLYPH VERTICAL JOINER..EGYPTIAN HIEROGLYPH END WALLED ENCLOSURE
+13440 ; Egyptian_Hieroglyphs # Mn EGYPTIAN HIEROGLYPH MIRROR HORIZONTALLY
+13441..13446 ; Egyptian_Hieroglyphs # Lo [6] EGYPTIAN HIEROGLYPH FULL BLANK..EGYPTIAN HIEROGLYPH WIDE LOST SIGN
+13447..13455 ; Egyptian_Hieroglyphs # Mn [15] EGYPTIAN HIEROGLYPH MODIFIER DAMAGED AT TOP START..EGYPTIAN HIEROGLYPH MODIFIER DAMAGED
+
+# Total code points: 1110
+
+# ================================================
+
+0800..0815 ; Samaritan # Lo [22] SAMARITAN LETTER ALAF..SAMARITAN LETTER TAAF
+0816..0819 ; Samaritan # Mn [4] SAMARITAN MARK IN..SAMARITAN MARK DAGESH
+081A ; Samaritan # Lm SAMARITAN MODIFIER LETTER EPENTHETIC YUT
+081B..0823 ; Samaritan # Mn [9] SAMARITAN MARK EPENTHETIC YUT..SAMARITAN VOWEL SIGN A
+0824 ; Samaritan # Lm SAMARITAN MODIFIER LETTER SHORT A
+0825..0827 ; Samaritan # Mn [3] SAMARITAN VOWEL SIGN SHORT A..SAMARITAN VOWEL SIGN U
+0828 ; Samaritan # Lm SAMARITAN MODIFIER LETTER I
+0829..082D ; Samaritan # Mn [5] SAMARITAN VOWEL SIGN LONG I..SAMARITAN MARK NEQUDAA
+0830..083E ; Samaritan # Po [15] SAMARITAN PUNCTUATION NEQUDAA..SAMARITAN PUNCTUATION ANNAAU
+
+# Total code points: 61
+
+# ================================================
+
+A4D0..A4F7 ; Lisu # Lo [40] LISU LETTER BA..LISU LETTER OE
+A4F8..A4FD ; Lisu # Lm [6] LISU LETTER TONE MYA TI..LISU LETTER TONE MYA JEU
+A4FE..A4FF ; Lisu # Po [2] LISU PUNCTUATION COMMA..LISU PUNCTUATION FULL STOP
+11FB0 ; Lisu # Lo LISU LETTER YHA
+
+# Total code points: 49
+
+# ================================================
+
+A6A0..A6E5 ; Bamum # Lo [70] BAMUM LETTER A..BAMUM LETTER KI
+A6E6..A6EF ; Bamum # Nl [10] BAMUM LETTER MO..BAMUM LETTER KOGHOM
+A6F0..A6F1 ; Bamum # Mn [2] BAMUM COMBINING MARK KOQNDON..BAMUM COMBINING MARK TUKWENTIS
+A6F2..A6F7 ; Bamum # Po [6] BAMUM NJAEMLI..BAMUM QUESTION MARK
+16800..16A38 ; Bamum # Lo [569] BAMUM LETTER PHASE-A NGKUE MFON..BAMUM LETTER PHASE-F VUEQ
+
+# Total code points: 657
+
+# ================================================
+
+A980..A982 ; Javanese # Mn [3] JAVANESE SIGN PANYANGGA..JAVANESE SIGN LAYAR
+A983 ; Javanese # Mc JAVANESE SIGN WIGNYAN
+A984..A9B2 ; Javanese # Lo [47] JAVANESE LETTER A..JAVANESE LETTER HA
+A9B3 ; Javanese # Mn JAVANESE SIGN CECAK TELU
+A9B4..A9B5 ; Javanese # Mc [2] JAVANESE VOWEL SIGN TARUNG..JAVANESE VOWEL SIGN TOLONG
+A9B6..A9B9 ; Javanese # Mn [4] JAVANESE VOWEL SIGN WULU..JAVANESE VOWEL SIGN SUKU MENDUT
+A9BA..A9BB ; Javanese # Mc [2] JAVANESE VOWEL SIGN TALING..JAVANESE VOWEL SIGN DIRGA MURE
+A9BC..A9BD ; Javanese # Mn [2] JAVANESE VOWEL SIGN PEPET..JAVANESE CONSONANT SIGN KERET
+A9BE..A9C0 ; Javanese # Mc [3] JAVANESE CONSONANT SIGN PENGKAL..JAVANESE PANGKON
+A9C1..A9CD ; Javanese # Po [13] JAVANESE LEFT RERENGGAN..JAVANESE TURNED PADA PISELEH
+A9D0..A9D9 ; Javanese # Nd [10] JAVANESE DIGIT ZERO..JAVANESE DIGIT NINE
+A9DE..A9DF ; Javanese # Po [2] JAVANESE PADA TIRTA TUMETES..JAVANESE PADA ISEN-ISEN
+
+# Total code points: 90
+
+# ================================================
+
+AAE0..AAEA ; Meetei_Mayek # Lo [11] MEETEI MAYEK LETTER E..MEETEI MAYEK LETTER SSA
+AAEB ; Meetei_Mayek # Mc MEETEI MAYEK VOWEL SIGN II
+AAEC..AAED ; Meetei_Mayek # Mn [2] MEETEI MAYEK VOWEL SIGN UU..MEETEI MAYEK VOWEL SIGN AAI
+AAEE..AAEF ; Meetei_Mayek # Mc [2] MEETEI MAYEK VOWEL SIGN AU..MEETEI MAYEK VOWEL SIGN AAU
+AAF0..AAF1 ; Meetei_Mayek # Po [2] MEETEI MAYEK CHEIKHAN..MEETEI MAYEK AHANG KHUDAM
+AAF2 ; Meetei_Mayek # Lo MEETEI MAYEK ANJI
+AAF3..AAF4 ; Meetei_Mayek # Lm [2] MEETEI MAYEK SYLLABLE REPETITION MARK..MEETEI MAYEK WORD REPETITION MARK
+AAF5 ; Meetei_Mayek # Mc MEETEI MAYEK VOWEL SIGN VISARGA
+AAF6 ; Meetei_Mayek # Mn MEETEI MAYEK VIRAMA
+ABC0..ABE2 ; Meetei_Mayek # Lo [35] MEETEI MAYEK LETTER KOK..MEETEI MAYEK LETTER I LONSUM
+ABE3..ABE4 ; Meetei_Mayek # Mc [2] MEETEI MAYEK VOWEL SIGN ONAP..MEETEI MAYEK VOWEL SIGN INAP
+ABE5 ; Meetei_Mayek # Mn MEETEI MAYEK VOWEL SIGN ANAP
+ABE6..ABE7 ; Meetei_Mayek # Mc [2] MEETEI MAYEK VOWEL SIGN YENAP..MEETEI MAYEK VOWEL SIGN SOUNAP
+ABE8 ; Meetei_Mayek # Mn MEETEI MAYEK VOWEL SIGN UNAP
+ABE9..ABEA ; Meetei_Mayek # Mc [2] MEETEI MAYEK VOWEL SIGN CHEINAP..MEETEI MAYEK VOWEL SIGN NUNG
+ABEB ; Meetei_Mayek # Po MEETEI MAYEK CHEIKHEI
+ABEC ; Meetei_Mayek # Mc MEETEI MAYEK LUM IYEK
+ABED ; Meetei_Mayek # Mn MEETEI MAYEK APUN IYEK
+ABF0..ABF9 ; Meetei_Mayek # Nd [10] MEETEI MAYEK DIGIT ZERO..MEETEI MAYEK DIGIT NINE
+
+# Total code points: 79
+
+# ================================================
+
+10840..10855 ; Imperial_Aramaic # Lo [22] IMPERIAL ARAMAIC LETTER ALEPH..IMPERIAL ARAMAIC LETTER TAW
+10857 ; Imperial_Aramaic # Po IMPERIAL ARAMAIC SECTION SIGN
+10858..1085F ; Imperial_Aramaic # No [8] IMPERIAL ARAMAIC NUMBER ONE..IMPERIAL ARAMAIC NUMBER TEN THOUSAND
+
+# Total code points: 31
+
+# ================================================
+
+10A60..10A7C ; Old_South_Arabian # Lo [29] OLD SOUTH ARABIAN LETTER HE..OLD SOUTH ARABIAN LETTER THETH
+10A7D..10A7E ; Old_South_Arabian # No [2] OLD SOUTH ARABIAN NUMBER ONE..OLD SOUTH ARABIAN NUMBER FIFTY
+10A7F ; Old_South_Arabian # Po OLD SOUTH ARABIAN NUMERIC INDICATOR
+
+# Total code points: 32
+
+# ================================================
+
+10B40..10B55 ; Inscriptional_Parthian # Lo [22] INSCRIPTIONAL PARTHIAN LETTER ALEPH..INSCRIPTIONAL PARTHIAN LETTER TAW
+10B58..10B5F ; Inscriptional_Parthian # No [8] INSCRIPTIONAL PARTHIAN NUMBER ONE..INSCRIPTIONAL PARTHIAN NUMBER ONE THOUSAND
+
+# Total code points: 30
+
+# ================================================
+
+10B60..10B72 ; Inscriptional_Pahlavi # Lo [19] INSCRIPTIONAL PAHLAVI LETTER ALEPH..INSCRIPTIONAL PAHLAVI LETTER TAW
+10B78..10B7F ; Inscriptional_Pahlavi # No [8] INSCRIPTIONAL PAHLAVI NUMBER ONE..INSCRIPTIONAL PAHLAVI NUMBER ONE THOUSAND
+
+# Total code points: 27
+
+# ================================================
+
+10C00..10C48 ; Old_Turkic # Lo [73] OLD TURKIC LETTER ORKHON A..OLD TURKIC LETTER ORKHON BASH
+
+# Total code points: 73
+
+# ================================================
+
+11080..11081 ; Kaithi # Mn [2] KAITHI SIGN CANDRABINDU..KAITHI SIGN ANUSVARA
+11082 ; Kaithi # Mc KAITHI SIGN VISARGA
+11083..110AF ; Kaithi # Lo [45] KAITHI LETTER A..KAITHI LETTER HA
+110B0..110B2 ; Kaithi # Mc [3] KAITHI VOWEL SIGN AA..KAITHI VOWEL SIGN II
+110B3..110B6 ; Kaithi # Mn [4] KAITHI VOWEL SIGN U..KAITHI VOWEL SIGN AI
+110B7..110B8 ; Kaithi # Mc [2] KAITHI VOWEL SIGN O..KAITHI VOWEL SIGN AU
+110B9..110BA ; Kaithi # Mn [2] KAITHI SIGN VIRAMA..KAITHI SIGN NUKTA
+110BB..110BC ; Kaithi # Po [2] KAITHI ABBREVIATION SIGN..KAITHI ENUMERATION SIGN
+110BD ; Kaithi # Cf KAITHI NUMBER SIGN
+110BE..110C1 ; Kaithi # Po [4] KAITHI SECTION MARK..KAITHI DOUBLE DANDA
+110C2 ; Kaithi # Mn KAITHI VOWEL SIGN VOCALIC R
+110CD ; Kaithi # Cf KAITHI NUMBER SIGN ABOVE
+
+# Total code points: 68
+
+# ================================================
+
+1BC0..1BE5 ; Batak # Lo [38] BATAK LETTER A..BATAK LETTER U
+1BE6 ; Batak # Mn BATAK SIGN TOMPI
+1BE7 ; Batak # Mc BATAK VOWEL SIGN E
+1BE8..1BE9 ; Batak # Mn [2] BATAK VOWEL SIGN PAKPAK E..BATAK VOWEL SIGN EE
+1BEA..1BEC ; Batak # Mc [3] BATAK VOWEL SIGN I..BATAK VOWEL SIGN O
+1BED ; Batak # Mn BATAK VOWEL SIGN KARO O
+1BEE ; Batak # Mc BATAK VOWEL SIGN U
+1BEF..1BF1 ; Batak # Mn [3] BATAK VOWEL SIGN U FOR SIMALUNGUN SA..BATAK CONSONANT SIGN H
+1BF2..1BF3 ; Batak # Mc [2] BATAK PANGOLAT..BATAK PANONGONAN
+1BFC..1BFF ; Batak # Po [4] BATAK SYMBOL BINDU NA METEK..BATAK SYMBOL BINDU PANGOLAT
+
+# Total code points: 56
+
+# ================================================
+
+11000 ; Brahmi # Mc BRAHMI SIGN CANDRABINDU
+11001 ; Brahmi # Mn BRAHMI SIGN ANUSVARA
+11002 ; Brahmi # Mc BRAHMI SIGN VISARGA
+11003..11037 ; Brahmi # Lo [53] BRAHMI SIGN JIHVAMULIYA..BRAHMI LETTER OLD TAMIL NNNA
+11038..11046 ; Brahmi # Mn [15] BRAHMI VOWEL SIGN AA..BRAHMI VIRAMA
+11047..1104D ; Brahmi # Po [7] BRAHMI DANDA..BRAHMI PUNCTUATION LOTUS
+11052..11065 ; Brahmi # No [20] BRAHMI NUMBER ONE..BRAHMI NUMBER ONE THOUSAND
+11066..1106F ; Brahmi # Nd [10] BRAHMI DIGIT ZERO..BRAHMI DIGIT NINE
+11070 ; Brahmi # Mn BRAHMI SIGN OLD TAMIL VIRAMA
+11071..11072 ; Brahmi # Lo [2] BRAHMI LETTER OLD TAMIL SHORT E..BRAHMI LETTER OLD TAMIL SHORT O
+11073..11074 ; Brahmi # Mn [2] BRAHMI VOWEL SIGN OLD TAMIL SHORT E..BRAHMI VOWEL SIGN OLD TAMIL SHORT O
+11075 ; Brahmi # Lo BRAHMI LETTER OLD TAMIL LLA
+1107F ; Brahmi # Mn BRAHMI NUMBER JOINER
+
+# Total code points: 115
+
+# ================================================
+
+0840..0858 ; Mandaic # Lo [25] MANDAIC LETTER HALQA..MANDAIC LETTER AIN
+0859..085B ; Mandaic # Mn [3] MANDAIC AFFRICATION MARK..MANDAIC GEMINATION MARK
+085E ; Mandaic # Po MANDAIC PUNCTUATION
+
+# Total code points: 29
+
+# ================================================
+
+11100..11102 ; Chakma # Mn [3] CHAKMA SIGN CANDRABINDU..CHAKMA SIGN VISARGA
+11103..11126 ; Chakma # Lo [36] CHAKMA LETTER AA..CHAKMA LETTER HAA
+11127..1112B ; Chakma # Mn [5] CHAKMA VOWEL SIGN A..CHAKMA VOWEL SIGN UU
+1112C ; Chakma # Mc CHAKMA VOWEL SIGN E
+1112D..11134 ; Chakma # Mn [8] CHAKMA VOWEL SIGN AI..CHAKMA MAAYYAA
+11136..1113F ; Chakma # Nd [10] CHAKMA DIGIT ZERO..CHAKMA DIGIT NINE
+11140..11143 ; Chakma # Po [4] CHAKMA SECTION MARK..CHAKMA QUESTION MARK
+11144 ; Chakma # Lo CHAKMA LETTER LHAA
+11145..11146 ; Chakma # Mc [2] CHAKMA VOWEL SIGN AA..CHAKMA VOWEL SIGN EI
+11147 ; Chakma # Lo CHAKMA LETTER VAA
+
+# Total code points: 71
+
+# ================================================
+
+109A0..109B7 ; Meroitic_Cursive # Lo [24] MEROITIC CURSIVE LETTER A..MEROITIC CURSIVE LETTER DA
+109BC..109BD ; Meroitic_Cursive # No [2] MEROITIC CURSIVE FRACTION ELEVEN TWELFTHS..MEROITIC CURSIVE FRACTION ONE HALF
+109BE..109BF ; Meroitic_Cursive # Lo [2] MEROITIC CURSIVE LOGOGRAM RMT..MEROITIC CURSIVE LOGOGRAM IMN
+109C0..109CF ; Meroitic_Cursive # No [16] MEROITIC CURSIVE NUMBER ONE..MEROITIC CURSIVE NUMBER SEVENTY
+109D2..109FF ; Meroitic_Cursive # No [46] MEROITIC CURSIVE NUMBER ONE HUNDRED..MEROITIC CURSIVE FRACTION TEN TWELFTHS
+
+# Total code points: 90
+
+# ================================================
+
+10980..1099F ; Meroitic_Hieroglyphs # Lo [32] MEROITIC HIEROGLYPHIC LETTER A..MEROITIC HIEROGLYPHIC SYMBOL VIDJ-2
+
+# Total code points: 32
+
+# ================================================
+
+16F00..16F4A ; Miao # Lo [75] MIAO LETTER PA..MIAO LETTER RTE
+16F4F ; Miao # Mn MIAO SIGN CONSONANT MODIFIER BAR
+16F50 ; Miao # Lo MIAO LETTER NASALIZATION
+16F51..16F87 ; Miao # Mc [55] MIAO SIGN ASPIRATION..MIAO VOWEL SIGN UI
+16F8F..16F92 ; Miao # Mn [4] MIAO TONE RIGHT..MIAO TONE BELOW
+16F93..16F9F ; Miao # Lm [13] MIAO LETTER TONE-2..MIAO LETTER REFORMED TONE-8
+
+# Total code points: 149
+
+# ================================================
+
+11180..11181 ; Sharada # Mn [2] SHARADA SIGN CANDRABINDU..SHARADA SIGN ANUSVARA
+11182 ; Sharada # Mc SHARADA SIGN VISARGA
+11183..111B2 ; Sharada # Lo [48] SHARADA LETTER A..SHARADA LETTER HA
+111B3..111B5 ; Sharada # Mc [3] SHARADA VOWEL SIGN AA..SHARADA VOWEL SIGN II
+111B6..111BE ; Sharada # Mn [9] SHARADA VOWEL SIGN U..SHARADA VOWEL SIGN O
+111BF..111C0 ; Sharada # Mc [2] SHARADA VOWEL SIGN AU..SHARADA SIGN VIRAMA
+111C1..111C4 ; Sharada # Lo [4] SHARADA SIGN AVAGRAHA..SHARADA OM
+111C5..111C8 ; Sharada # Po [4] SHARADA DANDA..SHARADA SEPARATOR
+111C9..111CC ; Sharada # Mn [4] SHARADA SANDHI MARK..SHARADA EXTRA SHORT VOWEL MARK
+111CD ; Sharada # Po SHARADA SUTRA MARK
+111CE ; Sharada # Mc SHARADA VOWEL SIGN PRISHTHAMATRA E
+111CF ; Sharada # Mn SHARADA SIGN INVERTED CANDRABINDU
+111D0..111D9 ; Sharada # Nd [10] SHARADA DIGIT ZERO..SHARADA DIGIT NINE
+111DA ; Sharada # Lo SHARADA EKAM
+111DB ; Sharada # Po SHARADA SIGN SIDDHAM
+111DC ; Sharada # Lo SHARADA HEADSTROKE
+111DD..111DF ; Sharada # Po [3] SHARADA CONTINUATION SIGN..SHARADA SECTION MARK-2
+
+# Total code points: 96
+
+# ================================================
+
+110D0..110E8 ; Sora_Sompeng # Lo [25] SORA SOMPENG LETTER SAH..SORA SOMPENG LETTER MAE
+110F0..110F9 ; Sora_Sompeng # Nd [10] SORA SOMPENG DIGIT ZERO..SORA SOMPENG DIGIT NINE
+
+# Total code points: 35
+
+# ================================================
+
+11680..116AA ; Takri # Lo [43] TAKRI LETTER A..TAKRI LETTER RRA
+116AB ; Takri # Mn TAKRI SIGN ANUSVARA
+116AC ; Takri # Mc TAKRI SIGN VISARGA
+116AD ; Takri # Mn TAKRI VOWEL SIGN AA
+116AE..116AF ; Takri # Mc [2] TAKRI VOWEL SIGN I..TAKRI VOWEL SIGN II
+116B0..116B5 ; Takri # Mn [6] TAKRI VOWEL SIGN U..TAKRI VOWEL SIGN AU
+116B6 ; Takri # Mc TAKRI SIGN VIRAMA
+116B7 ; Takri # Mn TAKRI SIGN NUKTA
+116B8 ; Takri # Lo TAKRI LETTER ARCHAIC KHA
+116B9 ; Takri # Po TAKRI ABBREVIATION SIGN
+116C0..116C9 ; Takri # Nd [10] TAKRI DIGIT ZERO..TAKRI DIGIT NINE
+
+# Total code points: 68
+
+# ================================================
+
+10530..10563 ; Caucasian_Albanian # Lo [52] CAUCASIAN ALBANIAN LETTER ALT..CAUCASIAN ALBANIAN LETTER KIW
+1056F ; Caucasian_Albanian # Po CAUCASIAN ALBANIAN CITATION MARK
+
+# Total code points: 53
+
+# ================================================
+
+16AD0..16AED ; Bassa_Vah # Lo [30] BASSA VAH LETTER ENNI..BASSA VAH LETTER I
+16AF0..16AF4 ; Bassa_Vah # Mn [5] BASSA VAH COMBINING HIGH TONE..BASSA VAH COMBINING HIGH-LOW TONE
+16AF5 ; Bassa_Vah # Po BASSA VAH FULL STOP
+
+# Total code points: 36
+
+# ================================================
+
+1BC00..1BC6A ; Duployan # Lo [107] DUPLOYAN LETTER H..DUPLOYAN LETTER VOCALIC M
+1BC70..1BC7C ; Duployan # Lo [13] DUPLOYAN AFFIX LEFT HORIZONTAL SECANT..DUPLOYAN AFFIX ATTACHED TANGENT HOOK
+1BC80..1BC88 ; Duployan # Lo [9] DUPLOYAN AFFIX HIGH ACUTE..DUPLOYAN AFFIX HIGH VERTICAL
+1BC90..1BC99 ; Duployan # Lo [10] DUPLOYAN AFFIX LOW ACUTE..DUPLOYAN AFFIX LOW ARROW
+1BC9C ; Duployan # So DUPLOYAN SIGN O WITH CROSS
+1BC9D..1BC9E ; Duployan # Mn [2] DUPLOYAN THICK LETTER SELECTOR..DUPLOYAN DOUBLE MARK
+1BC9F ; Duployan # Po DUPLOYAN PUNCTUATION CHINOOK FULL STOP
+
+# Total code points: 143
+
+# ================================================
+
+10500..10527 ; Elbasan # Lo [40] ELBASAN LETTER A..ELBASAN LETTER KHE
+
+# Total code points: 40
+
+# ================================================
+
+11300..11301 ; Grantha # Mn [2] GRANTHA SIGN COMBINING ANUSVARA ABOVE..GRANTHA SIGN CANDRABINDU
+11302..11303 ; Grantha # Mc [2] GRANTHA SIGN ANUSVARA..GRANTHA SIGN VISARGA
+11305..1130C ; Grantha # Lo [8] GRANTHA LETTER A..GRANTHA LETTER VOCALIC L
+1130F..11310 ; Grantha # Lo [2] GRANTHA LETTER EE..GRANTHA LETTER AI
+11313..11328 ; Grantha # Lo [22] GRANTHA LETTER OO..GRANTHA LETTER NA
+1132A..11330 ; Grantha # Lo [7] GRANTHA LETTER PA..GRANTHA LETTER RA
+11332..11333 ; Grantha # Lo [2] GRANTHA LETTER LA..GRANTHA LETTER LLA
+11335..11339 ; Grantha # Lo [5] GRANTHA LETTER VA..GRANTHA LETTER HA
+1133C ; Grantha # Mn GRANTHA SIGN NUKTA
+1133D ; Grantha # Lo GRANTHA SIGN AVAGRAHA
+1133E..1133F ; Grantha # Mc [2] GRANTHA VOWEL SIGN AA..GRANTHA VOWEL SIGN I
+11340 ; Grantha # Mn GRANTHA VOWEL SIGN II
+11341..11344 ; Grantha # Mc [4] GRANTHA VOWEL SIGN U..GRANTHA VOWEL SIGN VOCALIC RR
+11347..11348 ; Grantha # Mc [2] GRANTHA VOWEL SIGN EE..GRANTHA VOWEL SIGN AI
+1134B..1134D ; Grantha # Mc [3] GRANTHA VOWEL SIGN OO..GRANTHA SIGN VIRAMA
+11350 ; Grantha # Lo GRANTHA OM
+11357 ; Grantha # Mc GRANTHA AU LENGTH MARK
+1135D..11361 ; Grantha # Lo [5] GRANTHA SIGN PLUTA..GRANTHA LETTER VOCALIC LL
+11362..11363 ; Grantha # Mc [2] GRANTHA VOWEL SIGN VOCALIC L..GRANTHA VOWEL SIGN VOCALIC LL
+11366..1136C ; Grantha # Mn [7] COMBINING GRANTHA DIGIT ZERO..COMBINING GRANTHA DIGIT SIX
+11370..11374 ; Grantha # Mn [5] COMBINING GRANTHA LETTER A..COMBINING GRANTHA LETTER PA
+
+# Total code points: 85
+
+# ================================================
+
+16B00..16B2F ; Pahawh_Hmong # Lo [48] PAHAWH HMONG VOWEL KEEB..PAHAWH HMONG CONSONANT CAU
+16B30..16B36 ; Pahawh_Hmong # Mn [7] PAHAWH HMONG MARK CIM TUB..PAHAWH HMONG MARK CIM TAUM
+16B37..16B3B ; Pahawh_Hmong # Po [5] PAHAWH HMONG SIGN VOS THOM..PAHAWH HMONG SIGN VOS FEEM
+16B3C..16B3F ; Pahawh_Hmong # So [4] PAHAWH HMONG SIGN XYEEM NTXIV..PAHAWH HMONG SIGN XYEEM FAIB
+16B40..16B43 ; Pahawh_Hmong # Lm [4] PAHAWH HMONG SIGN VOS SEEV..PAHAWH HMONG SIGN IB YAM
+16B44 ; Pahawh_Hmong # Po PAHAWH HMONG SIGN XAUS
+16B45 ; Pahawh_Hmong # So PAHAWH HMONG SIGN CIM TSOV ROG
+16B50..16B59 ; Pahawh_Hmong # Nd [10] PAHAWH HMONG DIGIT ZERO..PAHAWH HMONG DIGIT NINE
+16B5B..16B61 ; Pahawh_Hmong # No [7] PAHAWH HMONG NUMBER TENS..PAHAWH HMONG NUMBER TRILLIONS
+16B63..16B77 ; Pahawh_Hmong # Lo [21] PAHAWH HMONG SIGN VOS LUB..PAHAWH HMONG SIGN CIM NRES TOS
+16B7D..16B8F ; Pahawh_Hmong # Lo [19] PAHAWH HMONG CLAN SIGN TSHEEJ..PAHAWH HMONG CLAN SIGN VWJ
+
+# Total code points: 127
+
+# ================================================
+
+11200..11211 ; Khojki # Lo [18] KHOJKI LETTER A..KHOJKI LETTER JJA
+11213..1122B ; Khojki # Lo [25] KHOJKI LETTER NYA..KHOJKI LETTER LLA
+1122C..1122E ; Khojki # Mc [3] KHOJKI VOWEL SIGN AA..KHOJKI VOWEL SIGN II
+1122F..11231 ; Khojki # Mn [3] KHOJKI VOWEL SIGN U..KHOJKI VOWEL SIGN AI
+11232..11233 ; Khojki # Mc [2] KHOJKI VOWEL SIGN O..KHOJKI VOWEL SIGN AU
+11234 ; Khojki # Mn KHOJKI SIGN ANUSVARA
+11235 ; Khojki # Mc KHOJKI SIGN VIRAMA
+11236..11237 ; Khojki # Mn [2] KHOJKI SIGN NUKTA..KHOJKI SIGN SHADDA
+11238..1123D ; Khojki # Po [6] KHOJKI DANDA..KHOJKI ABBREVIATION SIGN
+1123E ; Khojki # Mn KHOJKI SIGN SUKUN
+1123F..11240 ; Khojki # Lo [2] KHOJKI LETTER QA..KHOJKI LETTER SHORT I
+11241 ; Khojki # Mn KHOJKI VOWEL SIGN VOCALIC R
+
+# Total code points: 65
+
+# ================================================
+
+10600..10736 ; Linear_A # Lo [311] LINEAR A SIGN AB001..LINEAR A SIGN A664
+10740..10755 ; Linear_A # Lo [22] LINEAR A SIGN A701 A..LINEAR A SIGN A732 JE
+10760..10767 ; Linear_A # Lo [8] LINEAR A SIGN A800..LINEAR A SIGN A807
+
+# Total code points: 341
+
+# ================================================
+
+11150..11172 ; Mahajani # Lo [35] MAHAJANI LETTER A..MAHAJANI LETTER RRA
+11173 ; Mahajani # Mn MAHAJANI SIGN NUKTA
+11174..11175 ; Mahajani # Po [2] MAHAJANI ABBREVIATION SIGN..MAHAJANI SECTION MARK
+11176 ; Mahajani # Lo MAHAJANI LIGATURE SHRI
+
+# Total code points: 39
+
+# ================================================
+
+10AC0..10AC7 ; Manichaean # Lo [8] MANICHAEAN LETTER ALEPH..MANICHAEAN LETTER WAW
+10AC8 ; Manichaean # So MANICHAEAN SIGN UD
+10AC9..10AE4 ; Manichaean # Lo [28] MANICHAEAN LETTER ZAYIN..MANICHAEAN LETTER TAW
+10AE5..10AE6 ; Manichaean # Mn [2] MANICHAEAN ABBREVIATION MARK ABOVE..MANICHAEAN ABBREVIATION MARK BELOW
+10AEB..10AEF ; Manichaean # No [5] MANICHAEAN NUMBER ONE..MANICHAEAN NUMBER ONE HUNDRED
+10AF0..10AF6 ; Manichaean # Po [7] MANICHAEAN PUNCTUATION STAR..MANICHAEAN PUNCTUATION LINE FILLER
+
+# Total code points: 51
+
+# ================================================
+
+1E800..1E8C4 ; Mende_Kikakui # Lo [197] MENDE KIKAKUI SYLLABLE M001 KI..MENDE KIKAKUI SYLLABLE M060 NYON
+1E8C7..1E8CF ; Mende_Kikakui # No [9] MENDE KIKAKUI DIGIT ONE..MENDE KIKAKUI DIGIT NINE
+1E8D0..1E8D6 ; Mende_Kikakui # Mn [7] MENDE KIKAKUI COMBINING NUMBER TEENS..MENDE KIKAKUI COMBINING NUMBER MILLIONS
+
+# Total code points: 213
+
+# ================================================
+
+11600..1162F ; Modi # Lo [48] MODI LETTER A..MODI LETTER LLA
+11630..11632 ; Modi # Mc [3] MODI VOWEL SIGN AA..MODI VOWEL SIGN II
+11633..1163A ; Modi # Mn [8] MODI VOWEL SIGN U..MODI VOWEL SIGN AI
+1163B..1163C ; Modi # Mc [2] MODI VOWEL SIGN O..MODI VOWEL SIGN AU
+1163D ; Modi # Mn MODI SIGN ANUSVARA
+1163E ; Modi # Mc MODI SIGN VISARGA
+1163F..11640 ; Modi # Mn [2] MODI SIGN VIRAMA..MODI SIGN ARDHACANDRA
+11641..11643 ; Modi # Po [3] MODI DANDA..MODI ABBREVIATION SIGN
+11644 ; Modi # Lo MODI SIGN HUVA
+11650..11659 ; Modi # Nd [10] MODI DIGIT ZERO..MODI DIGIT NINE
+
+# Total code points: 79
+
+# ================================================
+
+16A40..16A5E ; Mro # Lo [31] MRO LETTER TA..MRO LETTER TEK
+16A60..16A69 ; Mro # Nd [10] MRO DIGIT ZERO..MRO DIGIT NINE
+16A6E..16A6F ; Mro # Po [2] MRO DANDA..MRO DOUBLE DANDA
+
+# Total code points: 43
+
+# ================================================
+
+10A80..10A9C ; Old_North_Arabian # Lo [29] OLD NORTH ARABIAN LETTER HEH..OLD NORTH ARABIAN LETTER ZAH
+10A9D..10A9F ; Old_North_Arabian # No [3] OLD NORTH ARABIAN NUMBER ONE..OLD NORTH ARABIAN NUMBER TWENTY
+
+# Total code points: 32
+
+# ================================================
+
+10880..1089E ; Nabataean # Lo [31] NABATAEAN LETTER FINAL ALEPH..NABATAEAN LETTER TAW
+108A7..108AF ; Nabataean # No [9] NABATAEAN NUMBER ONE..NABATAEAN NUMBER ONE HUNDRED
+
+# Total code points: 40
+
+# ================================================
+
+10860..10876 ; Palmyrene # Lo [23] PALMYRENE LETTER ALEPH..PALMYRENE LETTER TAW
+10877..10878 ; Palmyrene # So [2] PALMYRENE LEFT-POINTING FLEURON..PALMYRENE RIGHT-POINTING FLEURON
+10879..1087F ; Palmyrene # No [7] PALMYRENE NUMBER ONE..PALMYRENE NUMBER TWENTY
+
+# Total code points: 32
+
+# ================================================
+
+11AC0..11AF8 ; Pau_Cin_Hau # Lo [57] PAU CIN HAU LETTER PA..PAU CIN HAU GLOTTAL STOP FINAL
+
+# Total code points: 57
+
+# ================================================
+
+10350..10375 ; Old_Permic # Lo [38] OLD PERMIC LETTER AN..OLD PERMIC LETTER IA
+10376..1037A ; Old_Permic # Mn [5] COMBINING OLD PERMIC LETTER AN..COMBINING OLD PERMIC LETTER SII
+
+# Total code points: 43
+
+# ================================================
+
+10B80..10B91 ; Psalter_Pahlavi # Lo [18] PSALTER PAHLAVI LETTER ALEPH..PSALTER PAHLAVI LETTER TAW
+10B99..10B9C ; Psalter_Pahlavi # Po [4] PSALTER PAHLAVI SECTION MARK..PSALTER PAHLAVI FOUR DOTS WITH DOT
+10BA9..10BAF ; Psalter_Pahlavi # No [7] PSALTER PAHLAVI NUMBER ONE..PSALTER PAHLAVI NUMBER ONE HUNDRED
+
+# Total code points: 29
+
+# ================================================
+
+11580..115AE ; Siddham # Lo [47] SIDDHAM LETTER A..SIDDHAM LETTER HA
+115AF..115B1 ; Siddham # Mc [3] SIDDHAM VOWEL SIGN AA..SIDDHAM VOWEL SIGN II
+115B2..115B5 ; Siddham # Mn [4] SIDDHAM VOWEL SIGN U..SIDDHAM VOWEL SIGN VOCALIC RR
+115B8..115BB ; Siddham # Mc [4] SIDDHAM VOWEL SIGN E..SIDDHAM VOWEL SIGN AU
+115BC..115BD ; Siddham # Mn [2] SIDDHAM SIGN CANDRABINDU..SIDDHAM SIGN ANUSVARA
+115BE ; Siddham # Mc SIDDHAM SIGN VISARGA
+115BF..115C0 ; Siddham # Mn [2] SIDDHAM SIGN VIRAMA..SIDDHAM SIGN NUKTA
+115C1..115D7 ; Siddham # Po [23] SIDDHAM SIGN SIDDHAM..SIDDHAM SECTION MARK WITH CIRCLES AND FOUR ENCLOSURES
+115D8..115DB ; Siddham # Lo [4] SIDDHAM LETTER THREE-CIRCLE ALTERNATE I..SIDDHAM LETTER ALTERNATE U
+115DC..115DD ; Siddham # Mn [2] SIDDHAM VOWEL SIGN ALTERNATE U..SIDDHAM VOWEL SIGN ALTERNATE UU
+
+# Total code points: 92
+
+# ================================================
+
+112B0..112DE ; Khudawadi # Lo [47] KHUDAWADI LETTER A..KHUDAWADI LETTER HA
+112DF ; Khudawadi # Mn KHUDAWADI SIGN ANUSVARA
+112E0..112E2 ; Khudawadi # Mc [3] KHUDAWADI VOWEL SIGN AA..KHUDAWADI VOWEL SIGN II
+112E3..112EA ; Khudawadi # Mn [8] KHUDAWADI VOWEL SIGN U..KHUDAWADI SIGN VIRAMA
+112F0..112F9 ; Khudawadi # Nd [10] KHUDAWADI DIGIT ZERO..KHUDAWADI DIGIT NINE
+
+# Total code points: 69
+
+# ================================================
+
+11480..114AF ; Tirhuta # Lo [48] TIRHUTA ANJI..TIRHUTA LETTER HA
+114B0..114B2 ; Tirhuta # Mc [3] TIRHUTA VOWEL SIGN AA..TIRHUTA VOWEL SIGN II
+114B3..114B8 ; Tirhuta # Mn [6] TIRHUTA VOWEL SIGN U..TIRHUTA VOWEL SIGN VOCALIC LL
+114B9 ; Tirhuta # Mc TIRHUTA VOWEL SIGN E
+114BA ; Tirhuta # Mn TIRHUTA VOWEL SIGN SHORT E
+114BB..114BE ; Tirhuta # Mc [4] TIRHUTA VOWEL SIGN AI..TIRHUTA VOWEL SIGN AU
+114BF..114C0 ; Tirhuta # Mn [2] TIRHUTA SIGN CANDRABINDU..TIRHUTA SIGN ANUSVARA
+114C1 ; Tirhuta # Mc TIRHUTA SIGN VISARGA
+114C2..114C3 ; Tirhuta # Mn [2] TIRHUTA SIGN VIRAMA..TIRHUTA SIGN NUKTA
+114C4..114C5 ; Tirhuta # Lo [2] TIRHUTA SIGN AVAGRAHA..TIRHUTA GVANG
+114C6 ; Tirhuta # Po TIRHUTA ABBREVIATION SIGN
+114C7 ; Tirhuta # Lo TIRHUTA OM
+114D0..114D9 ; Tirhuta # Nd [10] TIRHUTA DIGIT ZERO..TIRHUTA DIGIT NINE
+
+# Total code points: 82
+
+# ================================================
+
+118A0..118DF ; Warang_Citi # L& [64] WARANG CITI CAPITAL LETTER NGAA..WARANG CITI SMALL LETTER VIYO
+118E0..118E9 ; Warang_Citi # Nd [10] WARANG CITI DIGIT ZERO..WARANG CITI DIGIT NINE
+118EA..118F2 ; Warang_Citi # No [9] WARANG CITI NUMBER TEN..WARANG CITI NUMBER NINETY
+118FF ; Warang_Citi # Lo WARANG CITI OM
+
+# Total code points: 84
+
+# ================================================
+
+11700..1171A ; Ahom # Lo [27] AHOM LETTER KA..AHOM LETTER ALTERNATE BA
+1171D..1171F ; Ahom # Mn [3] AHOM CONSONANT SIGN MEDIAL LA..AHOM CONSONANT SIGN MEDIAL LIGATING RA
+11720..11721 ; Ahom # Mc [2] AHOM VOWEL SIGN A..AHOM VOWEL SIGN AA
+11722..11725 ; Ahom # Mn [4] AHOM VOWEL SIGN I..AHOM VOWEL SIGN UU
+11726 ; Ahom # Mc AHOM VOWEL SIGN E
+11727..1172B ; Ahom # Mn [5] AHOM VOWEL SIGN AW..AHOM SIGN KILLER
+11730..11739 ; Ahom # Nd [10] AHOM DIGIT ZERO..AHOM DIGIT NINE
+1173A..1173B ; Ahom # No [2] AHOM NUMBER TEN..AHOM NUMBER TWENTY
+1173C..1173E ; Ahom # Po [3] AHOM SIGN SMALL SECTION..AHOM SIGN RULAI
+1173F ; Ahom # So AHOM SYMBOL VI
+11740..11746 ; Ahom # Lo [7] AHOM LETTER CA..AHOM LETTER LLA
+
+# Total code points: 65
+
+# ================================================
+
+14400..14646 ; Anatolian_Hieroglyphs # Lo [583] ANATOLIAN HIEROGLYPH A001..ANATOLIAN HIEROGLYPH A530
+
+# Total code points: 583
+
+# ================================================
+
+108E0..108F2 ; Hatran # Lo [19] HATRAN LETTER ALEPH..HATRAN LETTER QOPH
+108F4..108F5 ; Hatran # Lo [2] HATRAN LETTER SHIN..HATRAN LETTER TAW
+108FB..108FF ; Hatran # No [5] HATRAN NUMBER ONE..HATRAN NUMBER ONE HUNDRED
+
+# Total code points: 26
+
+# ================================================
+
+11280..11286 ; Multani # Lo [7] MULTANI LETTER A..MULTANI LETTER GA
+11288 ; Multani # Lo MULTANI LETTER GHA
+1128A..1128D ; Multani # Lo [4] MULTANI LETTER CA..MULTANI LETTER JJA
+1128F..1129D ; Multani # Lo [15] MULTANI LETTER NYA..MULTANI LETTER BA
+1129F..112A8 ; Multani # Lo [10] MULTANI LETTER BHA..MULTANI LETTER RHA
+112A9 ; Multani # Po MULTANI SECTION MARK
+
+# Total code points: 38
+
+# ================================================
+
+10C80..10CB2 ; Old_Hungarian # L& [51] OLD HUNGARIAN CAPITAL LETTER A..OLD HUNGARIAN CAPITAL LETTER US
+10CC0..10CF2 ; Old_Hungarian # L& [51] OLD HUNGARIAN SMALL LETTER A..OLD HUNGARIAN SMALL LETTER US
+10CFA..10CFF ; Old_Hungarian # No [6] OLD HUNGARIAN NUMBER ONE..OLD HUNGARIAN NUMBER ONE THOUSAND
+
+# Total code points: 108
+
+# ================================================
+
+1D800..1D9FF ; SignWriting # So [512] SIGNWRITING HAND-FIST INDEX..SIGNWRITING HEAD
+1DA00..1DA36 ; SignWriting # Mn [55] SIGNWRITING HEAD RIM..SIGNWRITING AIR SUCKING IN
+1DA37..1DA3A ; SignWriting # So [4] SIGNWRITING AIR BLOW SMALL ROTATIONS..SIGNWRITING BREATH EXHALE
+1DA3B..1DA6C ; SignWriting # Mn [50] SIGNWRITING MOUTH CLOSED NEUTRAL..SIGNWRITING EXCITEMENT
+1DA6D..1DA74 ; SignWriting # So [8] SIGNWRITING SHOULDER HIP SPINE..SIGNWRITING TORSO-FLOORPLANE TWISTING
+1DA75 ; SignWriting # Mn SIGNWRITING UPPER BODY TILTING FROM HIP JOINTS
+1DA76..1DA83 ; SignWriting # So [14] SIGNWRITING LIMB COMBINATION..SIGNWRITING LOCATION DEPTH
+1DA84 ; SignWriting # Mn SIGNWRITING LOCATION HEAD NECK
+1DA85..1DA86 ; SignWriting # So [2] SIGNWRITING LOCATION TORSO..SIGNWRITING LOCATION LIMBS DIGITS
+1DA87..1DA8B ; SignWriting # Po [5] SIGNWRITING COMMA..SIGNWRITING PARENTHESIS
+1DA9B..1DA9F ; SignWriting # Mn [5] SIGNWRITING FILL MODIFIER-2..SIGNWRITING FILL MODIFIER-6
+1DAA1..1DAAF ; SignWriting # Mn [15] SIGNWRITING ROTATION MODIFIER-2..SIGNWRITING ROTATION MODIFIER-16
+
+# Total code points: 672
+
+# ================================================
+
+1E900..1E943 ; Adlam # L& [68] ADLAM CAPITAL LETTER ALIF..ADLAM SMALL LETTER SHA
+1E944..1E94A ; Adlam # Mn [7] ADLAM ALIF LENGTHENER..ADLAM NUKTA
+1E94B ; Adlam # Lm ADLAM NASALIZATION MARK
+1E950..1E959 ; Adlam # Nd [10] ADLAM DIGIT ZERO..ADLAM DIGIT NINE
+1E95E..1E95F ; Adlam # Po [2] ADLAM INITIAL EXCLAMATION MARK..ADLAM INITIAL QUESTION MARK
+
+# Total code points: 88
+
+# ================================================
+
+11C00..11C08 ; Bhaiksuki # Lo [9] BHAIKSUKI LETTER A..BHAIKSUKI LETTER VOCALIC L
+11C0A..11C2E ; Bhaiksuki # Lo [37] BHAIKSUKI LETTER E..BHAIKSUKI LETTER HA
+11C2F ; Bhaiksuki # Mc BHAIKSUKI VOWEL SIGN AA
+11C30..11C36 ; Bhaiksuki # Mn [7] BHAIKSUKI VOWEL SIGN I..BHAIKSUKI VOWEL SIGN VOCALIC L
+11C38..11C3D ; Bhaiksuki # Mn [6] BHAIKSUKI VOWEL SIGN E..BHAIKSUKI SIGN ANUSVARA
+11C3E ; Bhaiksuki # Mc BHAIKSUKI SIGN VISARGA
+11C3F ; Bhaiksuki # Mn BHAIKSUKI SIGN VIRAMA
+11C40 ; Bhaiksuki # Lo BHAIKSUKI SIGN AVAGRAHA
+11C41..11C45 ; Bhaiksuki # Po [5] BHAIKSUKI DANDA..BHAIKSUKI GAP FILLER-2
+11C50..11C59 ; Bhaiksuki # Nd [10] BHAIKSUKI DIGIT ZERO..BHAIKSUKI DIGIT NINE
+11C5A..11C6C ; Bhaiksuki # No [19] BHAIKSUKI NUMBER ONE..BHAIKSUKI HUNDREDS UNIT MARK
+
+# Total code points: 97
+
+# ================================================
+
+11C70..11C71 ; Marchen # Po [2] MARCHEN HEAD MARK..MARCHEN MARK SHAD
+11C72..11C8F ; Marchen # Lo [30] MARCHEN LETTER KA..MARCHEN LETTER A
+11C92..11CA7 ; Marchen # Mn [22] MARCHEN SUBJOINED LETTER KA..MARCHEN SUBJOINED LETTER ZA
+11CA9 ; Marchen # Mc MARCHEN SUBJOINED LETTER YA
+11CAA..11CB0 ; Marchen # Mn [7] MARCHEN SUBJOINED LETTER RA..MARCHEN VOWEL SIGN AA
+11CB1 ; Marchen # Mc MARCHEN VOWEL SIGN I
+11CB2..11CB3 ; Marchen # Mn [2] MARCHEN VOWEL SIGN U..MARCHEN VOWEL SIGN E
+11CB4 ; Marchen # Mc MARCHEN VOWEL SIGN O
+11CB5..11CB6 ; Marchen # Mn [2] MARCHEN SIGN ANUSVARA..MARCHEN SIGN CANDRABINDU
+
+# Total code points: 68
+
+# ================================================
+
+11400..11434 ; Newa # Lo [53] NEWA LETTER A..NEWA LETTER HA
+11435..11437 ; Newa # Mc [3] NEWA VOWEL SIGN AA..NEWA VOWEL SIGN II
+11438..1143F ; Newa # Mn [8] NEWA VOWEL SIGN U..NEWA VOWEL SIGN AI
+11440..11441 ; Newa # Mc [2] NEWA VOWEL SIGN O..NEWA VOWEL SIGN AU
+11442..11444 ; Newa # Mn [3] NEWA SIGN VIRAMA..NEWA SIGN ANUSVARA
+11445 ; Newa # Mc NEWA SIGN VISARGA
+11446 ; Newa # Mn NEWA SIGN NUKTA
+11447..1144A ; Newa # Lo [4] NEWA SIGN AVAGRAHA..NEWA SIDDHI
+1144B..1144F ; Newa # Po [5] NEWA DANDA..NEWA ABBREVIATION SIGN
+11450..11459 ; Newa # Nd [10] NEWA DIGIT ZERO..NEWA DIGIT NINE
+1145A..1145B ; Newa # Po [2] NEWA DOUBLE COMMA..NEWA PLACEHOLDER MARK
+1145D ; Newa # Po NEWA INSERTION SIGN
+1145E ; Newa # Mn NEWA SANDHI MARK
+1145F..11461 ; Newa # Lo [3] NEWA LETTER VEDIC ANUSVARA..NEWA SIGN UPADHMANIYA
+
+# Total code points: 97
+
+# ================================================
+
+104B0..104D3 ; Osage # L& [36] OSAGE CAPITAL LETTER A..OSAGE CAPITAL LETTER ZHA
+104D8..104FB ; Osage # L& [36] OSAGE SMALL LETTER A..OSAGE SMALL LETTER ZHA
+
+# Total code points: 72
+
+# ================================================
+
+16FE0 ; Tangut # Lm TANGUT ITERATION MARK
+17000..187F7 ; Tangut # Lo [6136] TANGUT IDEOGRAPH-17000..TANGUT IDEOGRAPH-187F7
+18800..18AFF ; Tangut # Lo [768] TANGUT COMPONENT-001..TANGUT COMPONENT-768
+18D00..18D08 ; Tangut # Lo [9] TANGUT IDEOGRAPH-18D00..TANGUT IDEOGRAPH-18D08
+
+# Total code points: 6914
+
+# ================================================
+
+11D00..11D06 ; Masaram_Gondi # Lo [7] MASARAM GONDI LETTER A..MASARAM GONDI LETTER E
+11D08..11D09 ; Masaram_Gondi # Lo [2] MASARAM GONDI LETTER AI..MASARAM GONDI LETTER O
+11D0B..11D30 ; Masaram_Gondi # Lo [38] MASARAM GONDI LETTER AU..MASARAM GONDI LETTER TRA
+11D31..11D36 ; Masaram_Gondi # Mn [6] MASARAM GONDI VOWEL SIGN AA..MASARAM GONDI VOWEL SIGN VOCALIC R
+11D3A ; Masaram_Gondi # Mn MASARAM GONDI VOWEL SIGN E
+11D3C..11D3D ; Masaram_Gondi # Mn [2] MASARAM GONDI VOWEL SIGN AI..MASARAM GONDI VOWEL SIGN O
+11D3F..11D45 ; Masaram_Gondi # Mn [7] MASARAM GONDI VOWEL SIGN AU..MASARAM GONDI VIRAMA
+11D46 ; Masaram_Gondi # Lo MASARAM GONDI REPHA
+11D47 ; Masaram_Gondi # Mn MASARAM GONDI RA-KARA
+11D50..11D59 ; Masaram_Gondi # Nd [10] MASARAM GONDI DIGIT ZERO..MASARAM GONDI DIGIT NINE
+
+# Total code points: 75
+
+# ================================================
+
+16FE1 ; Nushu # Lm NUSHU ITERATION MARK
+1B170..1B2FB ; Nushu # Lo [396] NUSHU CHARACTER-1B170..NUSHU CHARACTER-1B2FB
+
+# Total code points: 397
+
+# ================================================
+
+11A50 ; Soyombo # Lo SOYOMBO LETTER A
+11A51..11A56 ; Soyombo # Mn [6] SOYOMBO VOWEL SIGN I..SOYOMBO VOWEL SIGN OE
+11A57..11A58 ; Soyombo # Mc [2] SOYOMBO VOWEL SIGN AI..SOYOMBO VOWEL SIGN AU
+11A59..11A5B ; Soyombo # Mn [3] SOYOMBO VOWEL SIGN VOCALIC R..SOYOMBO VOWEL LENGTH MARK
+11A5C..11A89 ; Soyombo # Lo [46] SOYOMBO LETTER KA..SOYOMBO CLUSTER-INITIAL LETTER SA
+11A8A..11A96 ; Soyombo # Mn [13] SOYOMBO FINAL CONSONANT SIGN G..SOYOMBO SIGN ANUSVARA
+11A97 ; Soyombo # Mc SOYOMBO SIGN VISARGA
+11A98..11A99 ; Soyombo # Mn [2] SOYOMBO GEMINATION MARK..SOYOMBO SUBJOINER
+11A9A..11A9C ; Soyombo # Po [3] SOYOMBO MARK TSHEG..SOYOMBO MARK DOUBLE SHAD
+11A9D ; Soyombo # Lo SOYOMBO MARK PLUTA
+11A9E..11AA2 ; Soyombo # Po [5] SOYOMBO HEAD MARK WITH MOON AND SUN AND TRIPLE FLAME..SOYOMBO TERMINAL MARK-2
+
+# Total code points: 83
+
+# ================================================
+
+11A00 ; Zanabazar_Square # Lo ZANABAZAR SQUARE LETTER A
+11A01..11A0A ; Zanabazar_Square # Mn [10] ZANABAZAR SQUARE VOWEL SIGN I..ZANABAZAR SQUARE VOWEL LENGTH MARK
+11A0B..11A32 ; Zanabazar_Square # Lo [40] ZANABAZAR SQUARE LETTER KA..ZANABAZAR SQUARE LETTER KSSA
+11A33..11A38 ; Zanabazar_Square # Mn [6] ZANABAZAR SQUARE FINAL CONSONANT MARK..ZANABAZAR SQUARE SIGN ANUSVARA
+11A39 ; Zanabazar_Square # Mc ZANABAZAR SQUARE SIGN VISARGA
+11A3A ; Zanabazar_Square # Lo ZANABAZAR SQUARE CLUSTER-INITIAL LETTER RA
+11A3B..11A3E ; Zanabazar_Square # Mn [4] ZANABAZAR SQUARE CLUSTER-FINAL LETTER YA..ZANABAZAR SQUARE CLUSTER-FINAL LETTER VA
+11A3F..11A46 ; Zanabazar_Square # Po [8] ZANABAZAR SQUARE INITIAL HEAD MARK..ZANABAZAR SQUARE CLOSING DOUBLE-LINED HEAD MARK
+11A47 ; Zanabazar_Square # Mn ZANABAZAR SQUARE SUBJOINER
+
+# Total code points: 72
+
+# ================================================
+
+11800..1182B ; Dogra # Lo [44] DOGRA LETTER A..DOGRA LETTER RRA
+1182C..1182E ; Dogra # Mc [3] DOGRA VOWEL SIGN AA..DOGRA VOWEL SIGN II
+1182F..11837 ; Dogra # Mn [9] DOGRA VOWEL SIGN U..DOGRA SIGN ANUSVARA
+11838 ; Dogra # Mc DOGRA SIGN VISARGA
+11839..1183A ; Dogra # Mn [2] DOGRA SIGN VIRAMA..DOGRA SIGN NUKTA
+1183B ; Dogra # Po DOGRA ABBREVIATION SIGN
+
+# Total code points: 60
+
+# ================================================
+
+11D60..11D65 ; Gunjala_Gondi # Lo [6] GUNJALA GONDI LETTER A..GUNJALA GONDI LETTER UU
+11D67..11D68 ; Gunjala_Gondi # Lo [2] GUNJALA GONDI LETTER EE..GUNJALA GONDI LETTER AI
+11D6A..11D89 ; Gunjala_Gondi # Lo [32] GUNJALA GONDI LETTER OO..GUNJALA GONDI LETTER SA
+11D8A..11D8E ; Gunjala_Gondi # Mc [5] GUNJALA GONDI VOWEL SIGN AA..GUNJALA GONDI VOWEL SIGN UU
+11D90..11D91 ; Gunjala_Gondi # Mn [2] GUNJALA GONDI VOWEL SIGN EE..GUNJALA GONDI VOWEL SIGN AI
+11D93..11D94 ; Gunjala_Gondi # Mc [2] GUNJALA GONDI VOWEL SIGN OO..GUNJALA GONDI VOWEL SIGN AU
+11D95 ; Gunjala_Gondi # Mn GUNJALA GONDI SIGN ANUSVARA
+11D96 ; Gunjala_Gondi # Mc GUNJALA GONDI SIGN VISARGA
+11D97 ; Gunjala_Gondi # Mn GUNJALA GONDI VIRAMA
+11D98 ; Gunjala_Gondi # Lo GUNJALA GONDI OM
+11DA0..11DA9 ; Gunjala_Gondi # Nd [10] GUNJALA GONDI DIGIT ZERO..GUNJALA GONDI DIGIT NINE
+
+# Total code points: 63
+
+# ================================================
+
+11EE0..11EF2 ; Makasar # Lo [19] MAKASAR LETTER KA..MAKASAR ANGKA
+11EF3..11EF4 ; Makasar # Mn [2] MAKASAR VOWEL SIGN I..MAKASAR VOWEL SIGN U
+11EF5..11EF6 ; Makasar # Mc [2] MAKASAR VOWEL SIGN E..MAKASAR VOWEL SIGN O
+11EF7..11EF8 ; Makasar # Po [2] MAKASAR PASSIMBANG..MAKASAR END OF SECTION
+
+# Total code points: 25
+
+# ================================================
+
+16E40..16E7F ; Medefaidrin # L& [64] MEDEFAIDRIN CAPITAL LETTER M..MEDEFAIDRIN SMALL LETTER Y
+16E80..16E96 ; Medefaidrin # No [23] MEDEFAIDRIN DIGIT ZERO..MEDEFAIDRIN DIGIT THREE ALTERNATE FORM
+16E97..16E9A ; Medefaidrin # Po [4] MEDEFAIDRIN COMMA..MEDEFAIDRIN EXCLAMATION OH
+
+# Total code points: 91
+
+# ================================================
+
+10D00..10D23 ; Hanifi_Rohingya # Lo [36] HANIFI ROHINGYA LETTER A..HANIFI ROHINGYA MARK NA KHONNA
+10D24..10D27 ; Hanifi_Rohingya # Mn [4] HANIFI ROHINGYA SIGN HARBAHAY..HANIFI ROHINGYA SIGN TASSI
+10D30..10D39 ; Hanifi_Rohingya # Nd [10] HANIFI ROHINGYA DIGIT ZERO..HANIFI ROHINGYA DIGIT NINE
+
+# Total code points: 50
+
+# ================================================
+
+10F30..10F45 ; Sogdian # Lo [22] SOGDIAN LETTER ALEPH..SOGDIAN INDEPENDENT SHIN
+10F46..10F50 ; Sogdian # Mn [11] SOGDIAN COMBINING DOT BELOW..SOGDIAN COMBINING STROKE BELOW
+10F51..10F54 ; Sogdian # No [4] SOGDIAN NUMBER ONE..SOGDIAN NUMBER ONE HUNDRED
+10F55..10F59 ; Sogdian # Po [5] SOGDIAN PUNCTUATION TWO VERTICAL BARS..SOGDIAN PUNCTUATION HALF CIRCLE WITH DOT
+
+# Total code points: 42
+
+# ================================================
+
+10F00..10F1C ; Old_Sogdian # Lo [29] OLD SOGDIAN LETTER ALEPH..OLD SOGDIAN LETTER FINAL TAW WITH VERTICAL TAIL
+10F1D..10F26 ; Old_Sogdian # No [10] OLD SOGDIAN NUMBER ONE..OLD SOGDIAN FRACTION ONE HALF
+10F27 ; Old_Sogdian # Lo OLD SOGDIAN LIGATURE AYIN-DALETH
+
+# Total code points: 40
+
+# ================================================
+
+10FE0..10FF6 ; Elymaic # Lo [23] ELYMAIC LETTER ALEPH..ELYMAIC LIGATURE ZAYIN-YODH
+
+# Total code points: 23
+
+# ================================================
+
+119A0..119A7 ; Nandinagari # Lo [8] NANDINAGARI LETTER A..NANDINAGARI LETTER VOCALIC RR
+119AA..119D0 ; Nandinagari # Lo [39] NANDINAGARI LETTER E..NANDINAGARI LETTER RRA
+119D1..119D3 ; Nandinagari # Mc [3] NANDINAGARI VOWEL SIGN AA..NANDINAGARI VOWEL SIGN II
+119D4..119D7 ; Nandinagari # Mn [4] NANDINAGARI VOWEL SIGN U..NANDINAGARI VOWEL SIGN VOCALIC RR
+119DA..119DB ; Nandinagari # Mn [2] NANDINAGARI VOWEL SIGN E..NANDINAGARI VOWEL SIGN AI
+119DC..119DF ; Nandinagari # Mc [4] NANDINAGARI VOWEL SIGN O..NANDINAGARI SIGN VISARGA
+119E0 ; Nandinagari # Mn NANDINAGARI SIGN VIRAMA
+119E1 ; Nandinagari # Lo NANDINAGARI SIGN AVAGRAHA
+119E2 ; Nandinagari # Po NANDINAGARI SIGN SIDDHAM
+119E3 ; Nandinagari # Lo NANDINAGARI HEADSTROKE
+119E4 ; Nandinagari # Mc NANDINAGARI VOWEL SIGN PRISHTHAMATRA E
+
+# Total code points: 65
+
+# ================================================
+
+1E100..1E12C ; Nyiakeng_Puachue_Hmong # Lo [45] NYIAKENG PUACHUE HMONG LETTER MA..NYIAKENG PUACHUE HMONG LETTER W
+1E130..1E136 ; Nyiakeng_Puachue_Hmong # Mn [7] NYIAKENG PUACHUE HMONG TONE-B..NYIAKENG PUACHUE HMONG TONE-D
+1E137..1E13D ; Nyiakeng_Puachue_Hmong # Lm [7] NYIAKENG PUACHUE HMONG SIGN FOR PERSON..NYIAKENG PUACHUE HMONG SYLLABLE LENGTHENER
+1E140..1E149 ; Nyiakeng_Puachue_Hmong # Nd [10] NYIAKENG PUACHUE HMONG DIGIT ZERO..NYIAKENG PUACHUE HMONG DIGIT NINE
+1E14E ; Nyiakeng_Puachue_Hmong # Lo NYIAKENG PUACHUE HMONG LOGOGRAM NYAJ
+1E14F ; Nyiakeng_Puachue_Hmong # So NYIAKENG PUACHUE HMONG CIRCLED CA
+
+# Total code points: 71
+
+# ================================================
+
+1E2C0..1E2EB ; Wancho # Lo [44] WANCHO LETTER AA..WANCHO LETTER YIH
+1E2EC..1E2EF ; Wancho # Mn [4] WANCHO TONE TUP..WANCHO TONE KOINI
+1E2F0..1E2F9 ; Wancho # Nd [10] WANCHO DIGIT ZERO..WANCHO DIGIT NINE
+1E2FF ; Wancho # Sc WANCHO NGUN SIGN
+
+# Total code points: 59
+
+# ================================================
+
+10FB0..10FC4 ; Chorasmian # Lo [21] CHORASMIAN LETTER ALEPH..CHORASMIAN LETTER TAW
+10FC5..10FCB ; Chorasmian # No [7] CHORASMIAN NUMBER ONE..CHORASMIAN NUMBER ONE HUNDRED
+
+# Total code points: 28
+
+# ================================================
+
+11900..11906 ; Dives_Akuru # Lo [7] DIVES AKURU LETTER A..DIVES AKURU LETTER E
+11909 ; Dives_Akuru # Lo DIVES AKURU LETTER O
+1190C..11913 ; Dives_Akuru # Lo [8] DIVES AKURU LETTER KA..DIVES AKURU LETTER JA
+11915..11916 ; Dives_Akuru # Lo [2] DIVES AKURU LETTER NYA..DIVES AKURU LETTER TTA
+11918..1192F ; Dives_Akuru # Lo [24] DIVES AKURU LETTER DDA..DIVES AKURU LETTER ZA
+11930..11935 ; Dives_Akuru # Mc [6] DIVES AKURU VOWEL SIGN AA..DIVES AKURU VOWEL SIGN E
+11937..11938 ; Dives_Akuru # Mc [2] DIVES AKURU VOWEL SIGN AI..DIVES AKURU VOWEL SIGN O
+1193B..1193C ; Dives_Akuru # Mn [2] DIVES AKURU SIGN ANUSVARA..DIVES AKURU SIGN CANDRABINDU
+1193D ; Dives_Akuru # Mc DIVES AKURU SIGN HALANTA
+1193E ; Dives_Akuru # Mn DIVES AKURU VIRAMA
+1193F ; Dives_Akuru # Lo DIVES AKURU PREFIXED NASAL SIGN
+11940 ; Dives_Akuru # Mc DIVES AKURU MEDIAL YA
+11941 ; Dives_Akuru # Lo DIVES AKURU INITIAL RA
+11942 ; Dives_Akuru # Mc DIVES AKURU MEDIAL RA
+11943 ; Dives_Akuru # Mn DIVES AKURU SIGN NUKTA
+11944..11946 ; Dives_Akuru # Po [3] DIVES AKURU DOUBLE DANDA..DIVES AKURU END OF TEXT MARK
+11950..11959 ; Dives_Akuru # Nd [10] DIVES AKURU DIGIT ZERO..DIVES AKURU DIGIT NINE
+
+# Total code points: 72
+
+# ================================================
+
+16FE4 ; Khitan_Small_Script # Mn KHITAN SMALL SCRIPT FILLER
+18B00..18CD5 ; Khitan_Small_Script # Lo [470] KHITAN SMALL SCRIPT CHARACTER-18B00..KHITAN SMALL SCRIPT CHARACTER-18CD5
+
+# Total code points: 471
+
+# ================================================
+
+10E80..10EA9 ; Yezidi # Lo [42] YEZIDI LETTER ELIF..YEZIDI LETTER ET
+10EAB..10EAC ; Yezidi # Mn [2] YEZIDI COMBINING HAMZA MARK..YEZIDI COMBINING MADDA MARK
+10EAD ; Yezidi # Pd YEZIDI HYPHENATION MARK
+10EB0..10EB1 ; Yezidi # Lo [2] YEZIDI LETTER LAM WITH DOT ABOVE..YEZIDI LETTER YOT WITH CIRCUMFLEX ABOVE
+
+# Total code points: 47
+
+# ================================================
+
+12F90..12FF0 ; Cypro_Minoan # Lo [97] CYPRO-MINOAN SIGN CM001..CYPRO-MINOAN SIGN CM114
+12FF1..12FF2 ; Cypro_Minoan # Po [2] CYPRO-MINOAN SIGN CM301..CYPRO-MINOAN SIGN CM302
+
+# Total code points: 99
+
+# ================================================
+
+10F70..10F81 ; Old_Uyghur # Lo [18] OLD UYGHUR LETTER ALEPH..OLD UYGHUR LETTER LESH
+10F82..10F85 ; Old_Uyghur # Mn [4] OLD UYGHUR COMBINING DOT ABOVE..OLD UYGHUR COMBINING TWO DOTS BELOW
+10F86..10F89 ; Old_Uyghur # Po [4] OLD UYGHUR PUNCTUATION BAR..OLD UYGHUR PUNCTUATION FOUR DOTS
+
+# Total code points: 26
+
+# ================================================
+
+16A70..16ABE ; Tangsa # Lo [79] TANGSA LETTER OZ..TANGSA LETTER ZA
+16AC0..16AC9 ; Tangsa # Nd [10] TANGSA DIGIT ZERO..TANGSA DIGIT NINE
+
+# Total code points: 89
+
+# ================================================
+
+1E290..1E2AD ; Toto # Lo [30] TOTO LETTER PA..TOTO LETTER A
+1E2AE ; Toto # Mn TOTO SIGN RISING TONE
+
+# Total code points: 31
+
+# ================================================
+
+10570..1057A ; Vithkuqi # L& [11] VITHKUQI CAPITAL LETTER A..VITHKUQI CAPITAL LETTER GA
+1057C..1058A ; Vithkuqi # L& [15] VITHKUQI CAPITAL LETTER HA..VITHKUQI CAPITAL LETTER RE
+1058C..10592 ; Vithkuqi # L& [7] VITHKUQI CAPITAL LETTER SE..VITHKUQI CAPITAL LETTER XE
+10594..10595 ; Vithkuqi # L& [2] VITHKUQI CAPITAL LETTER Y..VITHKUQI CAPITAL LETTER ZE
+10597..105A1 ; Vithkuqi # L& [11] VITHKUQI SMALL LETTER A..VITHKUQI SMALL LETTER GA
+105A3..105B1 ; Vithkuqi # L& [15] VITHKUQI SMALL LETTER HA..VITHKUQI SMALL LETTER RE
+105B3..105B9 ; Vithkuqi # L& [7] VITHKUQI SMALL LETTER SE..VITHKUQI SMALL LETTER XE
+105BB..105BC ; Vithkuqi # L& [2] VITHKUQI SMALL LETTER Y..VITHKUQI SMALL LETTER ZE
+
+# Total code points: 70
+
+# ================================================
+
+11F00..11F01 ; Kawi # Mn [2] KAWI SIGN CANDRABINDU..KAWI SIGN ANUSVARA
+11F02 ; Kawi # Lo KAWI SIGN REPHA
+11F03 ; Kawi # Mc KAWI SIGN VISARGA
+11F04..11F10 ; Kawi # Lo [13] KAWI LETTER A..KAWI LETTER O
+11F12..11F33 ; Kawi # Lo [34] KAWI LETTER KA..KAWI LETTER JNYA
+11F34..11F35 ; Kawi # Mc [2] KAWI VOWEL SIGN AA..KAWI VOWEL SIGN ALTERNATE AA
+11F36..11F3A ; Kawi # Mn [5] KAWI VOWEL SIGN I..KAWI VOWEL SIGN VOCALIC R
+11F3E..11F3F ; Kawi # Mc [2] KAWI VOWEL SIGN E..KAWI VOWEL SIGN AI
+11F40 ; Kawi # Mn KAWI VOWEL SIGN EU
+11F41 ; Kawi # Mc KAWI SIGN KILLER
+11F42 ; Kawi # Mn KAWI CONJOINER
+11F43..11F4F ; Kawi # Po [13] KAWI DANDA..KAWI PUNCTUATION CLOSING SPIRAL
+11F50..11F59 ; Kawi # Nd [10] KAWI DIGIT ZERO..KAWI DIGIT NINE
+
+# Total code points: 86
+
+# ================================================
+
+1E4D0..1E4EA ; Nag_Mundari # Lo [27] NAG MUNDARI LETTER O..NAG MUNDARI LETTER ELL
+1E4EB ; Nag_Mundari # Lm NAG MUNDARI SIGN OJOD
+1E4EC..1E4EF ; Nag_Mundari # Mn [4] NAG MUNDARI SIGN MUHOR..NAG MUNDARI SIGN SUTUH
+1E4F0..1E4F9 ; Nag_Mundari # Nd [10] NAG MUNDARI DIGIT ZERO..NAG MUNDARI DIGIT NINE
+
+# Total code points: 42
+
+# EOF
diff --git a/gen/data-files b/gen/data-files
index b2c4197..5b7921c 100755
--- a/gen/data-files
+++ b/gen/data-files
@@ -21,6 +21,7 @@ extracted/DerivedLineBreak
extracted/DerivedNumericType
extracted/DerivedNumericValues
PropList
+Scripts
SpecialCasing
UnicodeData
'
diff --git a/gen/prop/sc b/gen/prop/sc
new file mode 100755
index 0000000..40fc39b
--- /dev/null
+++ b/gen/prop/sc
@@ -0,0 +1,232 @@
+#!/bin/sh
+
+#!/bin/sh
+
+set -e
+cd "${0%/*}/../.."
+exec >lib/unicode/prop/uprop_get_sc.c
+
+# gawk rather than plain awk: the program below relies on strtonum(), a
+# gawk extension.
+gawk '
+BEGIN {
+ # A separator is optional spaces followed by either ";" and more spaces
+ # or a "#" comment running to the end of the line, so on a data line $1
+ # is the code point (or LO..HI range) and $2 is the script name.
+ FS = " *(; *|#.*)"
+
+ # Script names as spelled in data/Scripts, mapped to the suffix of the
+ # SC_* enumerator emitted for them. A name missing from this table
+ # would come out as a bare "SC_" in the generated file.
+ map["Adlam"] = "ADLM"
+ map["Caucasian_Albanian"] = "AGHB"
+ map["Ahom"] = "AHOM"
+ map["Arabic"] = "ARAB"
+ map["Imperial_Aramaic"] = "ARMI"
+ map["Armenian"] = "ARMN"
+ map["Avestan"] = "AVST"
+ map["Balinese"] = "BALI"
+ map["Bamum"] = "BAMU"
+ map["Bassa_Vah"] = "BASS"
+ map["Batak"] = "BATK"
+ map["Bengali"] = "BENG"
+ map["Bhaiksuki"] = "BHKS"
+ map["Bopomofo"] = "BOPO"
+ map["Brahmi"] = "BRAH"
+ map["Braille"] = "BRAI"
+ map["Buginese"] = "BUGI"
+ map["Buhid"] = "BUHD"
+ map["Chakma"] = "CAKM"
+ map["Canadian_Aboriginal"] = "CANS"
+ map["Carian"] = "CARI"
+ map["Cham"] = "CHAM"
+ map["Cherokee"] = "CHER"
+ map["Chorasmian"] = "CHRS"
+ map["Coptic"] = "COPT"
+ map["Cypro_Minoan"] = "CPMN"
+ map["Cypriot"] = "CPRT"
+ map["Cyrillic"] = "CYRL"
+ map["Devanagari"] = "DEVA"
+ map["Dives_Akuru"] = "DIAK"
+ map["Dogra"] = "DOGR"
+ map["Deseret"] = "DSRT"
+ map["Duployan"] = "DUPL"
+ map["Egyptian_Hieroglyphs"] = "EGYP"
+ map["Elbasan"] = "ELBA"
+ map["Elymaic"] = "ELYM"
+ map["Ethiopic"] = "ETHI"
+ map["Georgian"] = "GEOR"
+ map["Glagolitic"] = "GLAG"
+ map["Gunjala_Gondi"] = "GONG"
+ map["Masaram_Gondi"] = "GONM"
+ map["Gothic"] = "GOTH"
+ map["Grantha"] = "GRAN"
+ map["Greek"] = "GREK"
+ map["Gujarati"] = "GUJR"
+ map["Gurmukhi"] = "GURU"
+ map["Hangul"] = "HANG"
+ map["Han"] = "HANI"
+ map["Hanunoo"] = "HANO"
+ map["Hatran"] = "HATR"
+ map["Hebrew"] = "HEBR"
+ map["Hiragana"] = "HIRA"
+ map["Anatolian_Hieroglyphs"] = "HLUW"
+ map["Pahawh_Hmong"] = "HMNG"
+ map["Nyiakeng_Puachue_Hmong"] = "HMNP"
+ map["Katakana_Or_Hiragana"] = "HRKT"
+ map["Old_Hungarian"] = "HUNG"
+ map["Old_Italic"] = "ITAL"
+ map["Javanese"] = "JAVA"
+ map["Kayah_Li"] = "KALI"
+ map["Katakana"] = "KANA"
+ map["Kawi"] = "KAWI"
+ map["Kharoshthi"] = "KHAR"
+ map["Khmer"] = "KHMR"
+ map["Khojki"] = "KHOJ"
+ map["Khitan_Small_Script"] = "KITS"
+ map["Kannada"] = "KNDA"
+ map["Kaithi"] = "KTHI"
+ map["Tai_Tham"] = "LANA"
+ map["Lao"] = "LAOO"
+ map["Latin"] = "LATN"
+ map["Lepcha"] = "LEPC"
+ map["Limbu"] = "LIMB"
+ map["Linear_A"] = "LINA"
+ map["Linear_B"] = "LINB"
+ map["Lisu"] = "LISU"
+ map["Lycian"] = "LYCI"
+ map["Lydian"] = "LYDI"
+ map["Mahajani"] = "MAHJ"
+ map["Makasar"] = "MAKA"
+ map["Mandaic"] = "MAND"
+ map["Manichaean"] = "MANI"
+ map["Marchen"] = "MARC"
+ map["Medefaidrin"] = "MEDF"
+ map["Mende_Kikakui"] = "MEND"
+ map["Meroitic_Cursive"] = "MERC"
+ map["Meroitic_Hieroglyphs"] = "MERO"
+ map["Malayalam"] = "MLYM"
+ map["Modi"] = "MODI"
+ map["Mongolian"] = "MONG"
+ map["Mro"] = "MROO"
+ map["Meetei_Mayek"] = "MTEI"
+ map["Multani"] = "MULT"
+ map["Myanmar"] = "MYMR"
+ map["Nag_Mundari"] = "NAGM"
+ map["Nandinagari"] = "NAND"
+ map["Old_North_Arabian"] = "NARB"
+ map["Nabataean"] = "NBAT"
+ map["Newa"] = "NEWA"
+ map["Nko"] = "NKOO"
+ map["Nushu"] = "NSHU"
+ map["Ogham"] = "OGAM"
+ map["Ol_Chiki"] = "OLCK"
+ map["Old_Turkic"] = "ORKH"
+ map["Oriya"] = "ORYA"
+ map["Osage"] = "OSGE"
+ map["Osmanya"] = "OSMA"
+ map["Old_Uyghur"] = "OUGR"
+ map["Palmyrene"] = "PALM"
+ map["Pau_Cin_Hau"] = "PAUC"
+ map["Old_Permic"] = "PERM"
+ map["Phags_Pa"] = "PHAG"
+ map["Inscriptional_Pahlavi"] = "PHLI"
+ map["Psalter_Pahlavi"] = "PHLP"
+ map["Phoenician"] = "PHNX"
+ map["Miao"] = "PLRD"
+ map["Inscriptional_Parthian"] = "PRTI"
+ map["Rejang"] = "RJNG"
+ map["Hanifi_Rohingya"] = "ROHG"
+ map["Runic"] = "RUNR"
+ map["Samaritan"] = "SAMR"
+ map["Old_South_Arabian"] = "SARB"
+ map["Saurashtra"] = "SAUR"
+ map["SignWriting"] = "SGNW"
+ map["Shavian"] = "SHAW"
+ map["Sharada"] = "SHRD"
+ map["Siddham"] = "SIDD"
+ map["Khudawadi"] = "SIND"
+ map["Sinhala"] = "SINH"
+ map["Sogdian"] = "SOGD"
+ map["Old_Sogdian"] = "SOGO"
+ map["Sora_Sompeng"] = "SORA"
+ map["Soyombo"] = "SOYO"
+ map["Sundanese"] = "SUND"
+ map["Syloti_Nagri"] = "SYLO"
+ map["Syriac"] = "SYRC"
+ map["Tagbanwa"] = "TAGB"
+ map["Takri"] = "TAKR"
+ map["Tai_Le"] = "TALE"
+ map["New_Tai_Lue"] = "TALU"
+ map["Tamil"] = "TAML"
+ map["Tangut"] = "TANG"
+ map["Tai_Viet"] = "TAVT"
+ map["Telugu"] = "TELU"
+ map["Tifinagh"] = "TFNG"
+ map["Tagalog"] = "TGLG"
+ map["Thaana"] = "THAA"
+ map["Thai"] = "THAI"
+ map["Tibetan"] = "TIBT"
+ map["Tirhuta"] = "TIRH"
+ map["Tangsa"] = "TNSA"
+ map["Toto"] = "TOTO"
+ map["Ugaritic"] = "UGAR"
+ map["Vai"] = "VAII"
+ map["Vithkuqi"] = "VITH"
+ map["Warang_Citi"] = "WARA"
+ map["Wancho"] = "WCHO"
+ map["Old_Persian"] = "XPEO"
+ map["Cuneiform"] = "XSUX"
+ map["Yezidi"] = "YEZI"
+ map["Yi"] = "YIII"
+ map["Zanabazar_Square"] = "ZANB"
+ map["Inherited"] = "ZINH"
+ map["Common"] = "ZYYY"
+
+ # Fixed preamble of the generated C file: the do-not-edit banner and
+ # the headers it includes.
+ print "/* This file is autogenerated by gen/prop/sc; DO NOT EDIT. */"
+ print ""
+ print "#include \"__bsearch.h\""
+ print "#include \"macros.h\""
+ print "#include \"rune.h\""
+ print "#include \"unicode/prop.h\""
+ print ""
+}
+
+# Data lines only: comment lines begin with "#" and blank lines have no
+# first character at all, so neither matches.
+/^[^#]/ {
+	# $1 is either "XXXX" or "XXXX..YYYY"; for a single code point both
+	# bounds are read from the same array element.
+	parts = split($1, bounds, /\.\./)
+	first = strtonum("0X" bounds[1])
+	last = strtonum("0X" bounds[parts])
+
+	# Strip a leading "; " from the script name if one is present, then
+	# resolve the enumerator once for the whole range.
+	gsub(/^; /, "", $2)
+	script = "SC_" map[$2]
+
+	for (cp = first; cp <= last; cp++)
+		props[cp] = script
+}
+
+END {
+	# Code points U+0000..U+00FF get a directly indexed table, printed
+	# eight entries per row.
+	print "static constexpr enum uprop_sc lookup_lat1[] = {"
+	for (i = 0; i < 0x100; i++) {
+		if (i % 8 == 0)
+			printf "\t"
+		# A code point with no recorded script falls back to the named
+		# default (SC_ZZZZ is 0) instead of a bare 0.
+		printf "%-7s,%s", props[i] ? props[i] : "SC_ZZZZ", i % 8 == 7 ? "\n" : " "
+	}
+	print "};"
+	print ""
+
+	# Everything from U+0100 upwards is emitted as ascending,
+	# non-overlapping [lo, hi] ranges that share one script.
+	print "static const struct {"
+	print "\trune lo, hi;"
+	print "\tenum uprop_sc val;"
+	print "} lookup[] = {"
+
+	for (i = 0x100; i <= 0x10FFFF; i++) {
+		if (!props[i])
+			continue
+		# Extend the run while the next code point has the same script;
+		# i finishes on the last code point of the run.
+		lo = i
+		while (props[lo] == props[i + 1])
+			i++
+		printf "\t{RUNE_C(0x%06X), RUNE_C(0x%06X), %s},\n", lo, i, props[i]
+	}
+
+	print "};"
+	print ""
+	print "__MLIB_DEFINE_BSEARCH(enum uprop_sc, lookup, SC_ZZZZ)"
+	print ""
+	print "enum uprop_sc"
+	print "uprop_get_sc(rune ch)"
+	print "{"
+	# Strictly less than: lookup_lat1 has 0x100 entries, so valid indices
+	# stop at 0xFF and U+0100 must be answered by the range table.
+	print "\treturn ch < lengthof(lookup_lat1) ? lookup_lat1[ch] : mlib_lookup(ch);"
+	print "}"
+}
+' data/Scripts | sed 's/[[:space:]]*$//'
diff --git a/include/unicode/prop.h b/include/unicode/prop.h
index fd6c027..419908e 100644
--- a/include/unicode/prop.h
+++ b/include/unicode/prop.h
@@ -554,6 +554,174 @@ enum uprop_nt {
NT_NU, /* Numeric */
};
+/*
+ * Values of the Unicode Script (sc) property, as returned by uprop_get_sc().
+ * Each enumerator is SC_ followed by the script's four-letter code in
+ * uppercase; the trailing comment gives the script's name.  SC_ZZZZ
+ * (Unknown) is pinned to 0 and the remaining enumerators take consecutive
+ * values in the order listed, so reordering them changes their values.
+ */
+enum uprop_sc {
+ SC_ZZZZ = 0, /* Unknown */
+ SC_ADLM, /* Adlam */
+ SC_AGHB, /* Caucasian Albanian */
+ SC_AHOM, /* Ahom */
+ SC_ARAB, /* Arabic */
+ SC_ARMI, /* Imperial Aramaic */
+ SC_ARMN, /* Armenian */
+ SC_AVST, /* Avestan */
+ SC_BALI, /* Balinese */
+ SC_BAMU, /* Bamum */
+ SC_BASS, /* Bassa Vah */
+ SC_BATK, /* Batak */
+ SC_BENG, /* Bengali */
+ SC_BHKS, /* Bhaiksuki */
+ SC_BOPO, /* Bopomofo */
+ SC_BRAH, /* Brahmi */
+ SC_BRAI, /* Braille */
+ SC_BUGI, /* Buginese */
+ SC_BUHD, /* Buhid */
+ SC_CAKM, /* Chakma */
+ SC_CANS, /* Canadian Aboriginal */
+ SC_CARI, /* Carian */
+ SC_CHAM, /* Cham */
+ SC_CHER, /* Cherokee */
+ SC_CHRS, /* Chorasmian */
+ SC_COPT, /* Coptic */
+ SC_CPMN, /* Cypro-Minoan */
+ SC_CPRT, /* Cypriot */
+ SC_CYRL, /* Cyrillic */
+ SC_DEVA, /* Devanagari */
+ SC_DIAK, /* Dives Akuru */
+ SC_DOGR, /* Dogra */
+ SC_DSRT, /* Deseret */
+ SC_DUPL, /* Duployan */
+ SC_EGYP, /* Egyptian Hieroglyphs */
+ SC_ELBA, /* Elbasan */
+ SC_ELYM, /* Elymaic */
+ SC_ETHI, /* Ethiopic */
+ SC_GEOR, /* Georgian */
+ SC_GLAG, /* Glagolitic */
+ SC_GONG, /* Gunjala Gondi */
+ SC_GONM, /* Masaram Gondi */
+ SC_GOTH, /* Gothic */
+ SC_GRAN, /* Grantha */
+ SC_GREK, /* Greek */
+ SC_GUJR, /* Gujarati */
+ SC_GURU, /* Gurmukhi */
+ SC_HANG, /* Hangul */
+ SC_HANI, /* Han */
+ SC_HANO, /* Hanunoo */
+ SC_HATR, /* Hatran */
+ SC_HEBR, /* Hebrew */
+ SC_HIRA, /* Hiragana */
+ SC_HLUW, /* Anatolian Hieroglyphs */
+ SC_HMNG, /* Pahawh Hmong */
+ SC_HMNP, /* Nyiakeng Puachue Hmong */
+ SC_HRKT, /* Katakana or Hiragana */
+ SC_HUNG, /* Old Hungarian */
+ SC_ITAL, /* Old Italic */
+ SC_JAVA, /* Javanese */
+ SC_KALI, /* Kayah Li */
+ SC_KANA, /* Katakana */
+ SC_KAWI, /* Kawi */
+ SC_KHAR, /* Kharoshthi */
+ SC_KHMR, /* Khmer */
+ SC_KHOJ, /* Khojki */
+ SC_KITS, /* Khitan Small Script */
+ SC_KNDA, /* Kannada */
+ SC_KTHI, /* Kaithi */
+ SC_LANA, /* Tai Tham */
+ SC_LAOO, /* Lao */
+ SC_LATN, /* Latin */
+ SC_LEPC, /* Lepcha */
+ SC_LIMB, /* Limbu */
+ SC_LINA, /* Linear A */
+ SC_LINB, /* Linear B */
+ SC_LISU, /* Lisu */
+ SC_LYCI, /* Lycian */
+ SC_LYDI, /* Lydian */
+ SC_MAHJ, /* Mahajani */
+ SC_MAKA, /* Makasar */
+ SC_MAND, /* Mandaic */
+ SC_MANI, /* Manichaean */
+ SC_MARC, /* Marchen */
+ SC_MEDF, /* Medefaidrin */
+ SC_MEND, /* Mende Kikakui */
+ SC_MERC, /* Meroitic Cursive */
+ SC_MERO, /* Meroitic Hieroglyphs */
+ SC_MLYM, /* Malayalam */
+ SC_MODI, /* Modi */
+ SC_MONG, /* Mongolian */
+ SC_MROO, /* Mro */
+ SC_MTEI, /* Meetei Mayek */
+ SC_MULT, /* Multani */
+ SC_MYMR, /* Myanmar */
+ SC_NAGM, /* Nag Mundari */
+ SC_NAND, /* Nandinagari */
+ SC_NARB, /* Old North Arabian */
+ SC_NBAT, /* Nabataean */
+ SC_NEWA, /* Newa */
+ SC_NKOO, /* Nko */
+ SC_NSHU, /* Nushu */
+ SC_OGAM, /* Ogham */
+ SC_OLCK, /* Ol Chiki */
+ SC_ORKH, /* Old Turkic */
+ SC_ORYA, /* Oriya */
+ SC_OSGE, /* Osage */
+ SC_OSMA, /* Osmanya */
+ SC_OUGR, /* Old Uyghur */
+ SC_PALM, /* Palmyrene */
+ SC_PAUC, /* Pau Cin Hau */
+ SC_PERM, /* Old Permic */
+ SC_PHAG, /* Phags Pa */
+ SC_PHLI, /* Inscriptional Pahlavi */
+ SC_PHLP, /* Psalter Pahlavi */
+ SC_PHNX, /* Phoenician */
+ SC_PLRD, /* Miao */
+ SC_PRTI, /* Inscriptional Parthian */
+ SC_RJNG, /* Rejang */
+ SC_ROHG, /* Hanifi Rohingya */
+ SC_RUNR, /* Runic */
+ SC_SAMR, /* Samaritan */
+ SC_SARB, /* Old South Arabian */
+ SC_SAUR, /* Saurashtra */
+ SC_SGNW, /* SignWriting */
+ SC_SHAW, /* Shavian */
+ SC_SHRD, /* Sharada */
+ SC_SIDD, /* Siddham */
+ SC_SIND, /* Khudawadi */
+ SC_SINH, /* Sinhala */
+ SC_SOGD, /* Sogdian */
+ SC_SOGO, /* Old Sogdian */
+ SC_SORA, /* Sora Sompeng */
+ SC_SOYO, /* Soyombo */
+ SC_SUND, /* Sundanese */
+ SC_SYLO, /* Syloti Nagri */
+ SC_SYRC, /* Syriac */
+ SC_TAGB, /* Tagbanwa */
+ SC_TAKR, /* Takri */
+ SC_TALE, /* Tai Le */
+ SC_TALU, /* New Tai Lue */
+ SC_TAML, /* Tamil */
+ SC_TANG, /* Tangut */
+ SC_TAVT, /* Tai Viet */
+ SC_TELU, /* Telugu */
+ SC_TFNG, /* Tifinagh */
+ SC_TGLG, /* Tagalog */
+ SC_THAA, /* Thaana */
+ SC_THAI, /* Thai */
+ SC_TIBT, /* Tibetan */
+ SC_TIRH, /* Tirhuta */
+ SC_TNSA, /* Tangsa */
+ SC_TOTO, /* Toto */
+ SC_UGAR, /* Ugaritic */
+ SC_VAII, /* Vai */
+ SC_VITH, /* Vithkuqi */
+ SC_WARA, /* Warang Citi */
+ SC_WCHO, /* Wancho */
+ SC_XPEO, /* Old Persian */
+ SC_XSUX, /* Cuneiform */
+ SC_YEZI, /* Yezidi */
+ SC_YIII, /* Yi */
+ SC_ZANB, /* Zanabazar Square */
+ SC_ZINH, /* Inherited */
+ SC_ZYYY, /* Common */
+};
+
/* Not a Unicode property; but a nice-to-have */
[[__mlib_uprop_attrs]] struct u8view uprop_blkname(enum uprop_blk);
@@ -566,6 +734,7 @@ enum uprop_nt {
[[__mlib_uprop_attrs]] enum uprop_gc uprop_get_gc(rune);
[[__mlib_uprop_attrs]] enum uprop_lb uprop_get_lb(rune);
[[__mlib_uprop_attrs]] enum uprop_nt uprop_get_nt(rune);
+[[__mlib_uprop_attrs]] enum uprop_sc uprop_get_sc(rune);
[[__mlib_uprop_attrs]] rune uprop_get_bpb(rune);
[[__mlib_uprop_attrs]] rune uprop_get_slc(rune);
[[__mlib_uprop_attrs]] rune uprop_get_stc(rune);
diff --git a/lib/unicode/prop/uprop_get_sc.c b/lib/unicode/prop/uprop_get_sc.c
new file mode 100644
index 0000000..531c0c7
--- /dev/null
+++ b/lib/unicode/prop/uprop_get_sc.c
@@ -0,0 +1,995 @@
+/* This file is autogenerated by gen/prop/sc; DO NOT EDIT. */
+
+#include "__bsearch.h"
+#include "macros.h"
+#include "rune.h"
+#include "unicode/prop.h"
+
+/* Script of every code point from U+0000 to U+00FF: 256 entries, eight per
+   row, indexed directly by code point. */
+static constexpr enum uprop_sc lookup_lat1[] = {
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_LATN, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_ZYYY, SC_ZYYY, SC_LATN, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY, SC_ZYYY,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_ZYYY,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_ZYYY,
+ SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN, SC_LATN,
+};
+
+static const struct {
+ rune lo, hi;
+ enum uprop_sc val;
+} lookup[] = {
+ {RUNE_C(0x000100), RUNE_C(0x0002B8), SC_LATN},
+ {RUNE_C(0x0002B9), RUNE_C(0x0002DF), SC_ZYYY},
+ {RUNE_C(0x0002E0), RUNE_C(0x0002E4), SC_LATN},
+ {RUNE_C(0x0002E5), RUNE_C(0x0002E9), SC_ZYYY},
+ {RUNE_C(0x0002EA), RUNE_C(0x0002EB), SC_BOPO},
+ {RUNE_C(0x0002EC), RUNE_C(0x0002FF), SC_ZYYY},
+ {RUNE_C(0x000300), RUNE_C(0x00036F), SC_ZINH},
+ {RUNE_C(0x000370), RUNE_C(0x000373), SC_GREK},
+ {RUNE_C(0x000374), RUNE_C(0x000374), SC_ZYYY},
+ {RUNE_C(0x000375), RUNE_C(0x000377), SC_GREK},
+ {RUNE_C(0x00037A), RUNE_C(0x00037D), SC_GREK},
+ {RUNE_C(0x00037E), RUNE_C(0x00037E), SC_ZYYY},
+ {RUNE_C(0x00037F), RUNE_C(0x00037F), SC_GREK},
+ {RUNE_C(0x000384), RUNE_C(0x000384), SC_GREK},
+ {RUNE_C(0x000385), RUNE_C(0x000385), SC_ZYYY},
+ {RUNE_C(0x000386), RUNE_C(0x000386), SC_GREK},
+ {RUNE_C(0x000387), RUNE_C(0x000387), SC_ZYYY},
+ {RUNE_C(0x000388), RUNE_C(0x00038A), SC_GREK},
+ {RUNE_C(0x00038C), RUNE_C(0x00038C), SC_GREK},
+ {RUNE_C(0x00038E), RUNE_C(0x0003A1), SC_GREK},
+ {RUNE_C(0x0003A3), RUNE_C(0x0003E1), SC_GREK},
+ {RUNE_C(0x0003E2), RUNE_C(0x0003EF), SC_COPT},
+ {RUNE_C(0x0003F0), RUNE_C(0x0003FF), SC_GREK},
+ {RUNE_C(0x000400), RUNE_C(0x000484), SC_CYRL},
+ {RUNE_C(0x000485), RUNE_C(0x000486), SC_ZINH},
+ {RUNE_C(0x000487), RUNE_C(0x00052F), SC_CYRL},
+ {RUNE_C(0x000531), RUNE_C(0x000556), SC_ARMN},
+ {RUNE_C(0x000559), RUNE_C(0x00058A), SC_ARMN},
+ {RUNE_C(0x00058D), RUNE_C(0x00058F), SC_ARMN},
+ {RUNE_C(0x000591), RUNE_C(0x0005C7), SC_HEBR},
+ {RUNE_C(0x0005D0), RUNE_C(0x0005EA), SC_HEBR},
+ {RUNE_C(0x0005EF), RUNE_C(0x0005F4), SC_HEBR},
+ {RUNE_C(0x000600), RUNE_C(0x000604), SC_ARAB},
+ {RUNE_C(0x000605), RUNE_C(0x000605), SC_ZYYY},
+ {RUNE_C(0x000606), RUNE_C(0x00060B), SC_ARAB},
+ {RUNE_C(0x00060C), RUNE_C(0x00060C), SC_ZYYY},
+ {RUNE_C(0x00060D), RUNE_C(0x00061A), SC_ARAB},
+ {RUNE_C(0x00061B), RUNE_C(0x00061B), SC_ZYYY},
+ {RUNE_C(0x00061C), RUNE_C(0x00061E), SC_ARAB},
+ {RUNE_C(0x00061F), RUNE_C(0x00061F), SC_ZYYY},
+ {RUNE_C(0x000620), RUNE_C(0x00063F), SC_ARAB},
+ {RUNE_C(0x000640), RUNE_C(0x000640), SC_ZYYY},
+ {RUNE_C(0x000641), RUNE_C(0x00064A), SC_ARAB},
+ {RUNE_C(0x00064B), RUNE_C(0x000655), SC_ZINH},
+ {RUNE_C(0x000656), RUNE_C(0x00066F), SC_ARAB},
+ {RUNE_C(0x000670), RUNE_C(0x000670), SC_ZINH},
+ {RUNE_C(0x000671), RUNE_C(0x0006DC), SC_ARAB},
+ {RUNE_C(0x0006DD), RUNE_C(0x0006DD), SC_ZYYY},
+ {RUNE_C(0x0006DE), RUNE_C(0x0006FF), SC_ARAB},
+ {RUNE_C(0x000700), RUNE_C(0x00070D), SC_SYRC},
+ {RUNE_C(0x00070F), RUNE_C(0x00074A), SC_SYRC},
+ {RUNE_C(0x00074D), RUNE_C(0x00074F), SC_SYRC},
+ {RUNE_C(0x000750), RUNE_C(0x00077F), SC_ARAB},
+ {RUNE_C(0x000780), RUNE_C(0x0007B1), SC_THAA},
+ {RUNE_C(0x0007C0), RUNE_C(0x0007FA), SC_NKOO},
+ {RUNE_C(0x0007FD), RUNE_C(0x0007FF), SC_NKOO},
+ {RUNE_C(0x000800), RUNE_C(0x00082D), SC_SAMR},
+ {RUNE_C(0x000830), RUNE_C(0x00083E), SC_SAMR},
+ {RUNE_C(0x000840), RUNE_C(0x00085B), SC_MAND},
+ {RUNE_C(0x00085E), RUNE_C(0x00085E), SC_MAND},
+ {RUNE_C(0x000860), RUNE_C(0x00086A), SC_SYRC},
+ {RUNE_C(0x000870), RUNE_C(0x00088E), SC_ARAB},
+ {RUNE_C(0x000890), RUNE_C(0x000891), SC_ARAB},
+ {RUNE_C(0x000898), RUNE_C(0x0008E1), SC_ARAB},
+ {RUNE_C(0x0008E2), RUNE_C(0x0008E2), SC_ZYYY},
+ {RUNE_C(0x0008E3), RUNE_C(0x0008FF), SC_ARAB},
+ {RUNE_C(0x000900), RUNE_C(0x000950), SC_DEVA},
+ {RUNE_C(0x000951), RUNE_C(0x000954), SC_ZINH},
+ {RUNE_C(0x000955), RUNE_C(0x000963), SC_DEVA},
+ {RUNE_C(0x000964), RUNE_C(0x000965), SC_ZYYY},
+ {RUNE_C(0x000966), RUNE_C(0x00097F), SC_DEVA},
+ {RUNE_C(0x000980), RUNE_C(0x000983), SC_BENG},
+ {RUNE_C(0x000985), RUNE_C(0x00098C), SC_BENG},
+ {RUNE_C(0x00098F), RUNE_C(0x000990), SC_BENG},
+ {RUNE_C(0x000993), RUNE_C(0x0009A8), SC_BENG},
+ {RUNE_C(0x0009AA), RUNE_C(0x0009B0), SC_BENG},
+ {RUNE_C(0x0009B2), RUNE_C(0x0009B2), SC_BENG},
+ {RUNE_C(0x0009B6), RUNE_C(0x0009B9), SC_BENG},
+ {RUNE_C(0x0009BC), RUNE_C(0x0009C4), SC_BENG},
+ {RUNE_C(0x0009C7), RUNE_C(0x0009C8), SC_BENG},
+ {RUNE_C(0x0009CB), RUNE_C(0x0009CE), SC_BENG},
+ {RUNE_C(0x0009D7), RUNE_C(0x0009D7), SC_BENG},
+ {RUNE_C(0x0009DC), RUNE_C(0x0009DD), SC_BENG},
+ {RUNE_C(0x0009DF), RUNE_C(0x0009E3), SC_BENG},
+ {RUNE_C(0x0009E6), RUNE_C(0x0009FE), SC_BENG},
+ {RUNE_C(0x000A01), RUNE_C(0x000A03), SC_GURU},
+ {RUNE_C(0x000A05), RUNE_C(0x000A0A), SC_GURU},
+ {RUNE_C(0x000A0F), RUNE_C(0x000A10), SC_GURU},
+ {RUNE_C(0x000A13), RUNE_C(0x000A28), SC_GURU},
+ {RUNE_C(0x000A2A), RUNE_C(0x000A30), SC_GURU},
+ {RUNE_C(0x000A32), RUNE_C(0x000A33), SC_GURU},
+ {RUNE_C(0x000A35), RUNE_C(0x000A36), SC_GURU},
+ {RUNE_C(0x000A38), RUNE_C(0x000A39), SC_GURU},
+ {RUNE_C(0x000A3C), RUNE_C(0x000A3C), SC_GURU},
+ {RUNE_C(0x000A3E), RUNE_C(0x000A42), SC_GURU},
+ {RUNE_C(0x000A47), RUNE_C(0x000A48), SC_GURU},
+ {RUNE_C(0x000A4B), RUNE_C(0x000A4D), SC_GURU},
+ {RUNE_C(0x000A51), RUNE_C(0x000A51), SC_GURU},
+ {RUNE_C(0x000A59), RUNE_C(0x000A5C), SC_GURU},
+ {RUNE_C(0x000A5E), RUNE_C(0x000A5E), SC_GURU},
+ {RUNE_C(0x000A66), RUNE_C(0x000A76), SC_GURU},
+ {RUNE_C(0x000A81), RUNE_C(0x000A83), SC_GUJR},
+ {RUNE_C(0x000A85), RUNE_C(0x000A8D), SC_GUJR},
+ {RUNE_C(0x000A8F), RUNE_C(0x000A91), SC_GUJR},
+ {RUNE_C(0x000A93), RUNE_C(0x000AA8), SC_GUJR},
+ {RUNE_C(0x000AAA), RUNE_C(0x000AB0), SC_GUJR},
+ {RUNE_C(0x000AB2), RUNE_C(0x000AB3), SC_GUJR},
+ {RUNE_C(0x000AB5), RUNE_C(0x000AB9), SC_GUJR},
+ {RUNE_C(0x000ABC), RUNE_C(0x000AC5), SC_GUJR},
+ {RUNE_C(0x000AC7), RUNE_C(0x000AC9), SC_GUJR},
+ {RUNE_C(0x000ACB), RUNE_C(0x000ACD), SC_GUJR},
+ {RUNE_C(0x000AD0), RUNE_C(0x000AD0), SC_GUJR},
+ {RUNE_C(0x000AE0), RUNE_C(0x000AE3), SC_GUJR},
+ {RUNE_C(0x000AE6), RUNE_C(0x000AF1), SC_GUJR},
+ {RUNE_C(0x000AF9), RUNE_C(0x000AFF), SC_GUJR},
+ {RUNE_C(0x000B01), RUNE_C(0x000B03), SC_ORYA},
+ {RUNE_C(0x000B05), RUNE_C(0x000B0C), SC_ORYA},
+ {RUNE_C(0x000B0F), RUNE_C(0x000B10), SC_ORYA},
+ {RUNE_C(0x000B13), RUNE_C(0x000B28), SC_ORYA},
+ {RUNE_C(0x000B2A), RUNE_C(0x000B30), SC_ORYA},
+ {RUNE_C(0x000B32), RUNE_C(0x000B33), SC_ORYA},
+ {RUNE_C(0x000B35), RUNE_C(0x000B39), SC_ORYA},
+ {RUNE_C(0x000B3C), RUNE_C(0x000B44), SC_ORYA},
+ {RUNE_C(0x000B47), RUNE_C(0x000B48), SC_ORYA},
+ {RUNE_C(0x000B4B), RUNE_C(0x000B4D), SC_ORYA},
+ {RUNE_C(0x000B55), RUNE_C(0x000B57), SC_ORYA},
+ {RUNE_C(0x000B5C), RUNE_C(0x000B5D), SC_ORYA},
+ {RUNE_C(0x000B5F), RUNE_C(0x000B63), SC_ORYA},
+ {RUNE_C(0x000B66), RUNE_C(0x000B77), SC_ORYA},
+ {RUNE_C(0x000B82), RUNE_C(0x000B83), SC_TAML},
+ {RUNE_C(0x000B85), RUNE_C(0x000B8A), SC_TAML},
+ {RUNE_C(0x000B8E), RUNE_C(0x000B90), SC_TAML},
+ {RUNE_C(0x000B92), RUNE_C(0x000B95), SC_TAML},
+ {RUNE_C(0x000B99), RUNE_C(0x000B9A), SC_TAML},
+ {RUNE_C(0x000B9C), RUNE_C(0x000B9C), SC_TAML},
+ {RUNE_C(0x000B9E), RUNE_C(0x000B9F), SC_TAML},
+ {RUNE_C(0x000BA3), RUNE_C(0x000BA4), SC_TAML},
+ {RUNE_C(0x000BA8), RUNE_C(0x000BAA), SC_TAML},
+ {RUNE_C(0x000BAE), RUNE_C(0x000BB9), SC_TAML},
+ {RUNE_C(0x000BBE), RUNE_C(0x000BC2), SC_TAML},
+ {RUNE_C(0x000BC6), RUNE_C(0x000BC8), SC_TAML},
+ {RUNE_C(0x000BCA), RUNE_C(0x000BCD), SC_TAML},
+ {RUNE_C(0x000BD0), RUNE_C(0x000BD0), SC_TAML},
+ {RUNE_C(0x000BD7), RUNE_C(0x000BD7), SC_TAML},
+ {RUNE_C(0x000BE6), RUNE_C(0x000BFA), SC_TAML},
+ {RUNE_C(0x000C00), RUNE_C(0x000C0C), SC_TELU},
+ {RUNE_C(0x000C0E), RUNE_C(0x000C10), SC_TELU},
+ {RUNE_C(0x000C12), RUNE_C(0x000C28), SC_TELU},
+ {RUNE_C(0x000C2A), RUNE_C(0x000C39), SC_TELU},
+ {RUNE_C(0x000C3C), RUNE_C(0x000C44), SC_TELU},
+ {RUNE_C(0x000C46), RUNE_C(0x000C48), SC_TELU},
+ {RUNE_C(0x000C4A), RUNE_C(0x000C4D), SC_TELU},
+ {RUNE_C(0x000C55), RUNE_C(0x000C56), SC_TELU},
+ {RUNE_C(0x000C58), RUNE_C(0x000C5A), SC_TELU},
+ {RUNE_C(0x000C5D), RUNE_C(0x000C5D), SC_TELU},
+ {RUNE_C(0x000C60), RUNE_C(0x000C63), SC_TELU},
+ {RUNE_C(0x000C66), RUNE_C(0x000C6F), SC_TELU},
+ {RUNE_C(0x000C77), RUNE_C(0x000C7F), SC_TELU},
+ {RUNE_C(0x000C80), RUNE_C(0x000C8C), SC_KNDA},
+ {RUNE_C(0x000C8E), RUNE_C(0x000C90), SC_KNDA},
+ {RUNE_C(0x000C92), RUNE_C(0x000CA8), SC_KNDA},
+ {RUNE_C(0x000CAA), RUNE_C(0x000CB3), SC_KNDA},
+ {RUNE_C(0x000CB5), RUNE_C(0x000CB9), SC_KNDA},
+ {RUNE_C(0x000CBC), RUNE_C(0x000CC4), SC_KNDA},
+ {RUNE_C(0x000CC6), RUNE_C(0x000CC8), SC_KNDA},
+ {RUNE_C(0x000CCA), RUNE_C(0x000CCD), SC_KNDA},
+ {RUNE_C(0x000CD5), RUNE_C(0x000CD6), SC_KNDA},
+ {RUNE_C(0x000CDD), RUNE_C(0x000CDE), SC_KNDA},
+ {RUNE_C(0x000CE0), RUNE_C(0x000CE3), SC_KNDA},
+ {RUNE_C(0x000CE6), RUNE_C(0x000CEF), SC_KNDA},
+ {RUNE_C(0x000CF1), RUNE_C(0x000CF3), SC_KNDA},
+ {RUNE_C(0x000D00), RUNE_C(0x000D0C), SC_MLYM},
+ {RUNE_C(0x000D0E), RUNE_C(0x000D10), SC_MLYM},
+ {RUNE_C(0x000D12), RUNE_C(0x000D44), SC_MLYM},
+ {RUNE_C(0x000D46), RUNE_C(0x000D48), SC_MLYM},
+ {RUNE_C(0x000D4A), RUNE_C(0x000D4F), SC_MLYM},
+ {RUNE_C(0x000D54), RUNE_C(0x000D63), SC_MLYM},
+ {RUNE_C(0x000D66), RUNE_C(0x000D7F), SC_MLYM},
+ {RUNE_C(0x000D81), RUNE_C(0x000D83), SC_SINH},
+ {RUNE_C(0x000D85), RUNE_C(0x000D96), SC_SINH},
+ {RUNE_C(0x000D9A), RUNE_C(0x000DB1), SC_SINH},
+ {RUNE_C(0x000DB3), RUNE_C(0x000DBB), SC_SINH},
+ {RUNE_C(0x000DBD), RUNE_C(0x000DBD), SC_SINH},
+ {RUNE_C(0x000DC0), RUNE_C(0x000DC6), SC_SINH},
+ {RUNE_C(0x000DCA), RUNE_C(0x000DCA), SC_SINH},
+ {RUNE_C(0x000DCF), RUNE_C(0x000DD4), SC_SINH},
+ {RUNE_C(0x000DD6), RUNE_C(0x000DD6), SC_SINH},
+ {RUNE_C(0x000DD8), RUNE_C(0x000DDF), SC_SINH},
+ {RUNE_C(0x000DE6), RUNE_C(0x000DEF), SC_SINH},
+ {RUNE_C(0x000DF2), RUNE_C(0x000DF4), SC_SINH},
+ {RUNE_C(0x000E01), RUNE_C(0x000E3A), SC_THAI},
+ {RUNE_C(0x000E3F), RUNE_C(0x000E3F), SC_ZYYY},
+ {RUNE_C(0x000E40), RUNE_C(0x000E5B), SC_THAI},
+ {RUNE_C(0x000E81), RUNE_C(0x000E82), SC_LAOO},
+ {RUNE_C(0x000E84), RUNE_C(0x000E84), SC_LAOO},
+ {RUNE_C(0x000E86), RUNE_C(0x000E8A), SC_LAOO},
+ {RUNE_C(0x000E8C), RUNE_C(0x000EA3), SC_LAOO},
+ {RUNE_C(0x000EA5), RUNE_C(0x000EA5), SC_LAOO},
+ {RUNE_C(0x000EA7), RUNE_C(0x000EBD), SC_LAOO},
+ {RUNE_C(0x000EC0), RUNE_C(0x000EC4), SC_LAOO},
+ {RUNE_C(0x000EC6), RUNE_C(0x000EC6), SC_LAOO},
+ {RUNE_C(0x000EC8), RUNE_C(0x000ECE), SC_LAOO},
+ {RUNE_C(0x000ED0), RUNE_C(0x000ED9), SC_LAOO},
+ {RUNE_C(0x000EDC), RUNE_C(0x000EDF), SC_LAOO},
+ {RUNE_C(0x000F00), RUNE_C(0x000F47), SC_TIBT},
+ {RUNE_C(0x000F49), RUNE_C(0x000F6C), SC_TIBT},
+ {RUNE_C(0x000F71), RUNE_C(0x000F97), SC_TIBT},
+ {RUNE_C(0x000F99), RUNE_C(0x000FBC), SC_TIBT},
+ {RUNE_C(0x000FBE), RUNE_C(0x000FCC), SC_TIBT},
+ {RUNE_C(0x000FCE), RUNE_C(0x000FD4), SC_TIBT},
+ {RUNE_C(0x000FD5), RUNE_C(0x000FD8), SC_ZYYY},
+ {RUNE_C(0x000FD9), RUNE_C(0x000FDA), SC_TIBT},
+ {RUNE_C(0x001000), RUNE_C(0x00109F), SC_MYMR},
+ {RUNE_C(0x0010A0), RUNE_C(0x0010C5), SC_GEOR},
+ {RUNE_C(0x0010C7), RUNE_C(0x0010C7), SC_GEOR},
+ {RUNE_C(0x0010CD), RUNE_C(0x0010CD), SC_GEOR},
+ {RUNE_C(0x0010D0), RUNE_C(0x0010FA), SC_GEOR},
+ {RUNE_C(0x0010FB), RUNE_C(0x0010FB), SC_ZYYY},
+ {RUNE_C(0x0010FC), RUNE_C(0x0010FF), SC_GEOR},
+ {RUNE_C(0x001100), RUNE_C(0x0011FF), SC_HANG},
+ {RUNE_C(0x001200), RUNE_C(0x001248), SC_ETHI},
+ {RUNE_C(0x00124A), RUNE_C(0x00124D), SC_ETHI},
+ {RUNE_C(0x001250), RUNE_C(0x001256), SC_ETHI},
+ {RUNE_C(0x001258), RUNE_C(0x001258), SC_ETHI},
+ {RUNE_C(0x00125A), RUNE_C(0x00125D), SC_ETHI},
+ {RUNE_C(0x001260), RUNE_C(0x001288), SC_ETHI},
+ {RUNE_C(0x00128A), RUNE_C(0x00128D), SC_ETHI},
+ {RUNE_C(0x001290), RUNE_C(0x0012B0), SC_ETHI},
+ {RUNE_C(0x0012B2), RUNE_C(0x0012B5), SC_ETHI},
+ {RUNE_C(0x0012B8), RUNE_C(0x0012BE), SC_ETHI},
+ {RUNE_C(0x0012C0), RUNE_C(0x0012C0), SC_ETHI},
+ {RUNE_C(0x0012C2), RUNE_C(0x0012C5), SC_ETHI},
+ {RUNE_C(0x0012C8), RUNE_C(0x0012D6), SC_ETHI},
+ {RUNE_C(0x0012D8), RUNE_C(0x001310), SC_ETHI},
+ {RUNE_C(0x001312), RUNE_C(0x001315), SC_ETHI},
+ {RUNE_C(0x001318), RUNE_C(0x00135A), SC_ETHI},
+ {RUNE_C(0x00135D), RUNE_C(0x00137C), SC_ETHI},
+ {RUNE_C(0x001380), RUNE_C(0x001399), SC_ETHI},
+ {RUNE_C(0x0013A0), RUNE_C(0x0013F5), SC_CHER},
+ {RUNE_C(0x0013F8), RUNE_C(0x0013FD), SC_CHER},
+ {RUNE_C(0x001400), RUNE_C(0x00167F), SC_CANS},
+ {RUNE_C(0x001680), RUNE_C(0x00169C), SC_OGAM},
+ {RUNE_C(0x0016A0), RUNE_C(0x0016EA), SC_RUNR},
+ {RUNE_C(0x0016EB), RUNE_C(0x0016ED), SC_ZYYY},
+ {RUNE_C(0x0016EE), RUNE_C(0x0016F8), SC_RUNR},
+ {RUNE_C(0x001700), RUNE_C(0x001715), SC_TGLG},
+ {RUNE_C(0x00171F), RUNE_C(0x00171F), SC_TGLG},
+ {RUNE_C(0x001720), RUNE_C(0x001734), SC_HANO},
+ {RUNE_C(0x001735), RUNE_C(0x001736), SC_ZYYY},
+ {RUNE_C(0x001740), RUNE_C(0x001753), SC_BUHD},
+ {RUNE_C(0x001760), RUNE_C(0x00176C), SC_TAGB},
+ {RUNE_C(0x00176E), RUNE_C(0x001770), SC_TAGB},
+ {RUNE_C(0x001772), RUNE_C(0x001773), SC_TAGB},
+ {RUNE_C(0x001780), RUNE_C(0x0017DD), SC_KHMR},
+ {RUNE_C(0x0017E0), RUNE_C(0x0017E9), SC_KHMR},
+ {RUNE_C(0x0017F0), RUNE_C(0x0017F9), SC_KHMR},
+ {RUNE_C(0x001800), RUNE_C(0x001801), SC_MONG},
+ {RUNE_C(0x001802), RUNE_C(0x001803), SC_ZYYY},
+ {RUNE_C(0x001804), RUNE_C(0x001804), SC_MONG},
+ {RUNE_C(0x001805), RUNE_C(0x001805), SC_ZYYY},
+ {RUNE_C(0x001806), RUNE_C(0x001819), SC_MONG},
+ {RUNE_C(0x001820), RUNE_C(0x001878), SC_MONG},
+ {RUNE_C(0x001880), RUNE_C(0x0018AA), SC_MONG},
+ {RUNE_C(0x0018B0), RUNE_C(0x0018F5), SC_CANS},
+ {RUNE_C(0x001900), RUNE_C(0x00191E), SC_LIMB},
+ {RUNE_C(0x001920), RUNE_C(0x00192B), SC_LIMB},
+ {RUNE_C(0x001930), RUNE_C(0x00193B), SC_LIMB},
+ {RUNE_C(0x001940), RUNE_C(0x001940), SC_LIMB},
+ {RUNE_C(0x001944), RUNE_C(0x00194F), SC_LIMB},
+ {RUNE_C(0x001950), RUNE_C(0x00196D), SC_TALE},
+ {RUNE_C(0x001970), RUNE_C(0x001974), SC_TALE},
+ {RUNE_C(0x001980), RUNE_C(0x0019AB), SC_TALU},
+ {RUNE_C(0x0019B0), RUNE_C(0x0019C9), SC_TALU},
+ {RUNE_C(0x0019D0), RUNE_C(0x0019DA), SC_TALU},
+ {RUNE_C(0x0019DE), RUNE_C(0x0019DF), SC_TALU},
+ {RUNE_C(0x0019E0), RUNE_C(0x0019FF), SC_KHMR},
+ {RUNE_C(0x001A00), RUNE_C(0x001A1B), SC_BUGI},
+ {RUNE_C(0x001A1E), RUNE_C(0x001A1F), SC_BUGI},
+ {RUNE_C(0x001A20), RUNE_C(0x001A5E), SC_LANA},
+ {RUNE_C(0x001A60), RUNE_C(0x001A7C), SC_LANA},
+ {RUNE_C(0x001A7F), RUNE_C(0x001A89), SC_LANA},
+ {RUNE_C(0x001A90), RUNE_C(0x001A99), SC_LANA},
+ {RUNE_C(0x001AA0), RUNE_C(0x001AAD), SC_LANA},
+ {RUNE_C(0x001AB0), RUNE_C(0x001ACE), SC_ZINH},
+ {RUNE_C(0x001B00), RUNE_C(0x001B4C), SC_BALI},
+ {RUNE_C(0x001B50), RUNE_C(0x001B7E), SC_BALI},
+ {RUNE_C(0x001B80), RUNE_C(0x001BBF), SC_SUND},
+ {RUNE_C(0x001BC0), RUNE_C(0x001BF3), SC_BATK},
+ {RUNE_C(0x001BFC), RUNE_C(0x001BFF), SC_BATK},
+ {RUNE_C(0x001C00), RUNE_C(0x001C37), SC_LEPC},
+ {RUNE_C(0x001C3B), RUNE_C(0x001C49), SC_LEPC},
+ {RUNE_C(0x001C4D), RUNE_C(0x001C4F), SC_LEPC},
+ {RUNE_C(0x001C50), RUNE_C(0x001C7F), SC_OLCK},
+ {RUNE_C(0x001C80), RUNE_C(0x001C88), SC_CYRL},
+ {RUNE_C(0x001C90), RUNE_C(0x001CBA), SC_GEOR},
+ {RUNE_C(0x001CBD), RUNE_C(0x001CBF), SC_GEOR},
+ {RUNE_C(0x001CC0), RUNE_C(0x001CC7), SC_SUND},
+ {RUNE_C(0x001CD0), RUNE_C(0x001CD2), SC_ZINH},
+ {RUNE_C(0x001CD3), RUNE_C(0x001CD3), SC_ZYYY},
+ {RUNE_C(0x001CD4), RUNE_C(0x001CE0), SC_ZINH},
+ {RUNE_C(0x001CE1), RUNE_C(0x001CE1), SC_ZYYY},
+ {RUNE_C(0x001CE2), RUNE_C(0x001CE8), SC_ZINH},
+ {RUNE_C(0x001CE9), RUNE_C(0x001CEC), SC_ZYYY},
+ {RUNE_C(0x001CED), RUNE_C(0x001CED), SC_ZINH},
+ {RUNE_C(0x001CEE), RUNE_C(0x001CF3), SC_ZYYY},
+ {RUNE_C(0x001CF4), RUNE_C(0x001CF4), SC_ZINH},
+ {RUNE_C(0x001CF5), RUNE_C(0x001CF7), SC_ZYYY},
+ {RUNE_C(0x001CF8), RUNE_C(0x001CF9), SC_ZINH},
+ {RUNE_C(0x001CFA), RUNE_C(0x001CFA), SC_ZYYY},
+ {RUNE_C(0x001D00), RUNE_C(0x001D25), SC_LATN},
+ {RUNE_C(0x001D26), RUNE_C(0x001D2A), SC_GREK},
+ {RUNE_C(0x001D2B), RUNE_C(0x001D2B), SC_CYRL},
+ {RUNE_C(0x001D2C), RUNE_C(0x001D5C), SC_LATN},
+ {RUNE_C(0x001D5D), RUNE_C(0x001D61), SC_GREK},
+ {RUNE_C(0x001D62), RUNE_C(0x001D65), SC_LATN},
+ {RUNE_C(0x001D66), RUNE_C(0x001D6A), SC_GREK},
+ {RUNE_C(0x001D6B), RUNE_C(0x001D77), SC_LATN},
+ {RUNE_C(0x001D78), RUNE_C(0x001D78), SC_CYRL},
+ {RUNE_C(0x001D79), RUNE_C(0x001DBE), SC_LATN},
+ {RUNE_C(0x001DBF), RUNE_C(0x001DBF), SC_GREK},
+ {RUNE_C(0x001DC0), RUNE_C(0x001DFF), SC_ZINH},
+ {RUNE_C(0x001E00), RUNE_C(0x001EFF), SC_LATN},
+ {RUNE_C(0x001F00), RUNE_C(0x001F15), SC_GREK},
+ {RUNE_C(0x001F18), RUNE_C(0x001F1D), SC_GREK},
+ {RUNE_C(0x001F20), RUNE_C(0x001F45), SC_GREK},
+ {RUNE_C(0x001F48), RUNE_C(0x001F4D), SC_GREK},
+ {RUNE_C(0x001F50), RUNE_C(0x001F57), SC_GREK},
+ {RUNE_C(0x001F59), RUNE_C(0x001F59), SC_GREK},
+ {RUNE_C(0x001F5B), RUNE_C(0x001F5B), SC_GREK},
+ {RUNE_C(0x001F5D), RUNE_C(0x001F5D), SC_GREK},
+ {RUNE_C(0x001F5F), RUNE_C(0x001F7D), SC_GREK},
+ {RUNE_C(0x001F80), RUNE_C(0x001FB4), SC_GREK},
+ {RUNE_C(0x001FB6), RUNE_C(0x001FC4), SC_GREK},
+ {RUNE_C(0x001FC6), RUNE_C(0x001FD3), SC_GREK},
+ {RUNE_C(0x001FD6), RUNE_C(0x001FDB), SC_GREK},
+ {RUNE_C(0x001FDD), RUNE_C(0x001FEF), SC_GREK},
+ {RUNE_C(0x001FF2), RUNE_C(0x001FF4), SC_GREK},
+ {RUNE_C(0x001FF6), RUNE_C(0x001FFE), SC_GREK},
+ {RUNE_C(0x002000), RUNE_C(0x00200B), SC_ZYYY},
+ {RUNE_C(0x00200C), RUNE_C(0x00200D), SC_ZINH},
+ {RUNE_C(0x00200E), RUNE_C(0x002064), SC_ZYYY},
+ {RUNE_C(0x002066), RUNE_C(0x002070), SC_ZYYY},
+ {RUNE_C(0x002071), RUNE_C(0x002071), SC_LATN},
+ {RUNE_C(0x002074), RUNE_C(0x00207E), SC_ZYYY},
+ {RUNE_C(0x00207F), RUNE_C(0x00207F), SC_LATN},
+ {RUNE_C(0x002080), RUNE_C(0x00208E), SC_ZYYY},
+ {RUNE_C(0x002090), RUNE_C(0x00209C), SC_LATN},
+ {RUNE_C(0x0020A0), RUNE_C(0x0020C0), SC_ZYYY},
+ {RUNE_C(0x0020D0), RUNE_C(0x0020F0), SC_ZINH},
+ {RUNE_C(0x002100), RUNE_C(0x002125), SC_ZYYY},
+ {RUNE_C(0x002126), RUNE_C(0x002126), SC_GREK},
+ {RUNE_C(0x002127), RUNE_C(0x002129), SC_ZYYY},
+ {RUNE_C(0x00212A), RUNE_C(0x00212B), SC_LATN},
+ {RUNE_C(0x00212C), RUNE_C(0x002131), SC_ZYYY},
+ {RUNE_C(0x002132), RUNE_C(0x002132), SC_LATN},
+ {RUNE_C(0x002133), RUNE_C(0x00214D), SC_ZYYY},
+ {RUNE_C(0x00214E), RUNE_C(0x00214E), SC_LATN},
+ {RUNE_C(0x00214F), RUNE_C(0x00215F), SC_ZYYY},
+ {RUNE_C(0x002160), RUNE_C(0x002188), SC_LATN},
+ {RUNE_C(0x002189), RUNE_C(0x00218B), SC_ZYYY},
+ {RUNE_C(0x002190), RUNE_C(0x002426), SC_ZYYY},
+ {RUNE_C(0x002440), RUNE_C(0x00244A), SC_ZYYY},
+ {RUNE_C(0x002460), RUNE_C(0x0027FF), SC_ZYYY},
+ {RUNE_C(0x002800), RUNE_C(0x0028FF), SC_BRAI},
+ {RUNE_C(0x002900), RUNE_C(0x002B73), SC_ZYYY},
+ {RUNE_C(0x002B76), RUNE_C(0x002B95), SC_ZYYY},
+ {RUNE_C(0x002B97), RUNE_C(0x002BFF), SC_ZYYY},
+ {RUNE_C(0x002C00), RUNE_C(0x002C5F), SC_GLAG},
+ {RUNE_C(0x002C60), RUNE_C(0x002C7F), SC_LATN},
+ {RUNE_C(0x002C80), RUNE_C(0x002CF3), SC_COPT},
+ {RUNE_C(0x002CF9), RUNE_C(0x002CFF), SC_COPT},
+ {RUNE_C(0x002D00), RUNE_C(0x002D25), SC_GEOR},
+ {RUNE_C(0x002D27), RUNE_C(0x002D27), SC_GEOR},
+ {RUNE_C(0x002D2D), RUNE_C(0x002D2D), SC_GEOR},
+ {RUNE_C(0x002D30), RUNE_C(0x002D67), SC_TFNG},
+ {RUNE_C(0x002D6F), RUNE_C(0x002D70), SC_TFNG},
+ {RUNE_C(0x002D7F), RUNE_C(0x002D7F), SC_TFNG},
+ {RUNE_C(0x002D80), RUNE_C(0x002D96), SC_ETHI},
+ {RUNE_C(0x002DA0), RUNE_C(0x002DA6), SC_ETHI},
+ {RUNE_C(0x002DA8), RUNE_C(0x002DAE), SC_ETHI},
+ {RUNE_C(0x002DB0), RUNE_C(0x002DB6), SC_ETHI},
+ {RUNE_C(0x002DB8), RUNE_C(0x002DBE), SC_ETHI},
+ {RUNE_C(0x002DC0), RUNE_C(0x002DC6), SC_ETHI},
+ {RUNE_C(0x002DC8), RUNE_C(0x002DCE), SC_ETHI},
+ {RUNE_C(0x002DD0), RUNE_C(0x002DD6), SC_ETHI},
+ {RUNE_C(0x002DD8), RUNE_C(0x002DDE), SC_ETHI},
+ {RUNE_C(0x002DE0), RUNE_C(0x002DFF), SC_CYRL},
+ {RUNE_C(0x002E00), RUNE_C(0x002E5D), SC_ZYYY},
+ {RUNE_C(0x002E80), RUNE_C(0x002E99), SC_HANI},
+ {RUNE_C(0x002E9B), RUNE_C(0x002EF3), SC_HANI},
+ {RUNE_C(0x002F00), RUNE_C(0x002FD5), SC_HANI},
+ {RUNE_C(0x002FF0), RUNE_C(0x003004), SC_ZYYY},
+ {RUNE_C(0x003005), RUNE_C(0x003005), SC_HANI},
+ {RUNE_C(0x003006), RUNE_C(0x003006), SC_ZYYY},
+ {RUNE_C(0x003007), RUNE_C(0x003007), SC_HANI},
+ {RUNE_C(0x003008), RUNE_C(0x003020), SC_ZYYY},
+ {RUNE_C(0x003021), RUNE_C(0x003029), SC_HANI},
+ {RUNE_C(0x00302A), RUNE_C(0x00302D), SC_ZINH},
+ {RUNE_C(0x00302E), RUNE_C(0x00302F), SC_HANG},
+ {RUNE_C(0x003030), RUNE_C(0x003037), SC_ZYYY},
+ {RUNE_C(0x003038), RUNE_C(0x00303B), SC_HANI},
+ {RUNE_C(0x00303C), RUNE_C(0x00303F), SC_ZYYY},
+ {RUNE_C(0x003041), RUNE_C(0x003096), SC_HIRA},
+ {RUNE_C(0x003099), RUNE_C(0x00309A), SC_ZINH},
+ {RUNE_C(0x00309B), RUNE_C(0x00309C), SC_ZYYY},
+ {RUNE_C(0x00309D), RUNE_C(0x00309F), SC_HIRA},
+ {RUNE_C(0x0030A0), RUNE_C(0x0030A0), SC_ZYYY},
+ {RUNE_C(0x0030A1), RUNE_C(0x0030FA), SC_KANA},
+ {RUNE_C(0x0030FB), RUNE_C(0x0030FC), SC_ZYYY},
+ {RUNE_C(0x0030FD), RUNE_C(0x0030FF), SC_KANA},
+ {RUNE_C(0x003105), RUNE_C(0x00312F), SC_BOPO},
+ {RUNE_C(0x003131), RUNE_C(0x00318E), SC_HANG},
+ {RUNE_C(0x003190), RUNE_C(0x00319F), SC_ZYYY},
+ {RUNE_C(0x0031A0), RUNE_C(0x0031BF), SC_BOPO},
+ {RUNE_C(0x0031C0), RUNE_C(0x0031E3), SC_ZYYY},
+ {RUNE_C(0x0031EF), RUNE_C(0x0031EF), SC_ZYYY},
+ {RUNE_C(0x0031F0), RUNE_C(0x0031FF), SC_KANA},
+ {RUNE_C(0x003200), RUNE_C(0x00321E), SC_HANG},
+ {RUNE_C(0x003220), RUNE_C(0x00325F), SC_ZYYY},
+ {RUNE_C(0x003260), RUNE_C(0x00327E), SC_HANG},
+ {RUNE_C(0x00327F), RUNE_C(0x0032CF), SC_ZYYY},
+ {RUNE_C(0x0032D0), RUNE_C(0x0032FE), SC_KANA},
+ {RUNE_C(0x0032FF), RUNE_C(0x0032FF), SC_ZYYY},
+ {RUNE_C(0x003300), RUNE_C(0x003357), SC_KANA},
+ {RUNE_C(0x003358), RUNE_C(0x0033FF), SC_ZYYY},
+ {RUNE_C(0x003400), RUNE_C(0x004DBF), SC_HANI},
+ {RUNE_C(0x004DC0), RUNE_C(0x004DFF), SC_ZYYY},
+ {RUNE_C(0x004E00), RUNE_C(0x009FFF), SC_HANI},
+ {RUNE_C(0x00A000), RUNE_C(0x00A48C), SC_YIII},
+ {RUNE_C(0x00A490), RUNE_C(0x00A4C6), SC_YIII},
+ {RUNE_C(0x00A4D0), RUNE_C(0x00A4FF), SC_LISU},
+ {RUNE_C(0x00A500), RUNE_C(0x00A62B), SC_VAII},
+ {RUNE_C(0x00A640), RUNE_C(0x00A69F), SC_CYRL},
+ {RUNE_C(0x00A6A0), RUNE_C(0x00A6F7), SC_BAMU},
+ {RUNE_C(0x00A700), RUNE_C(0x00A721), SC_ZYYY},
+ {RUNE_C(0x00A722), RUNE_C(0x00A787), SC_LATN},
+ {RUNE_C(0x00A788), RUNE_C(0x00A78A), SC_ZYYY},
+ {RUNE_C(0x00A78B), RUNE_C(0x00A7CA), SC_LATN},
+ {RUNE_C(0x00A7D0), RUNE_C(0x00A7D1), SC_LATN},
+ {RUNE_C(0x00A7D3), RUNE_C(0x00A7D3), SC_LATN},
+ {RUNE_C(0x00A7D5), RUNE_C(0x00A7D9), SC_LATN},
+ {RUNE_C(0x00A7F2), RUNE_C(0x00A7FF), SC_LATN},
+ {RUNE_C(0x00A800), RUNE_C(0x00A82C), SC_SYLO},
+ {RUNE_C(0x00A830), RUNE_C(0x00A839), SC_ZYYY},
+ {RUNE_C(0x00A840), RUNE_C(0x00A877), SC_PHAG},
+ {RUNE_C(0x00A880), RUNE_C(0x00A8C5), SC_SAUR},
+ {RUNE_C(0x00A8CE), RUNE_C(0x00A8D9), SC_SAUR},
+ {RUNE_C(0x00A8E0), RUNE_C(0x00A8FF), SC_DEVA},
+ {RUNE_C(0x00A900), RUNE_C(0x00A92D), SC_KALI},
+ {RUNE_C(0x00A92E), RUNE_C(0x00A92E), SC_ZYYY},
+ {RUNE_C(0x00A92F), RUNE_C(0x00A92F), SC_KALI},
+ {RUNE_C(0x00A930), RUNE_C(0x00A953), SC_RJNG},
+ {RUNE_C(0x00A95F), RUNE_C(0x00A95F), SC_RJNG},
+ {RUNE_C(0x00A960), RUNE_C(0x00A97C), SC_HANG},
+ {RUNE_C(0x00A980), RUNE_C(0x00A9CD), SC_JAVA},
+ {RUNE_C(0x00A9CF), RUNE_C(0x00A9CF), SC_ZYYY},
+ {RUNE_C(0x00A9D0), RUNE_C(0x00A9D9), SC_JAVA},
+ {RUNE_C(0x00A9DE), RUNE_C(0x00A9DF), SC_JAVA},
+ {RUNE_C(0x00A9E0), RUNE_C(0x00A9FE), SC_MYMR},
+ {RUNE_C(0x00AA00), RUNE_C(0x00AA36), SC_CHAM},
+ {RUNE_C(0x00AA40), RUNE_C(0x00AA4D), SC_CHAM},
+ {RUNE_C(0x00AA50), RUNE_C(0x00AA59), SC_CHAM},
+ {RUNE_C(0x00AA5C), RUNE_C(0x00AA5F), SC_CHAM},
+ {RUNE_C(0x00AA60), RUNE_C(0x00AA7F), SC_MYMR},
+ {RUNE_C(0x00AA80), RUNE_C(0x00AAC2), SC_TAVT},
+ {RUNE_C(0x00AADB), RUNE_C(0x00AADF), SC_TAVT},
+ {RUNE_C(0x00AAE0), RUNE_C(0x00AAF6), SC_MTEI},
+ {RUNE_C(0x00AB01), RUNE_C(0x00AB06), SC_ETHI},
+ {RUNE_C(0x00AB09), RUNE_C(0x00AB0E), SC_ETHI},
+ {RUNE_C(0x00AB11), RUNE_C(0x00AB16), SC_ETHI},
+ {RUNE_C(0x00AB20), RUNE_C(0x00AB26), SC_ETHI},
+ {RUNE_C(0x00AB28), RUNE_C(0x00AB2E), SC_ETHI},
+ {RUNE_C(0x00AB30), RUNE_C(0x00AB5A), SC_LATN},
+ {RUNE_C(0x00AB5B), RUNE_C(0x00AB5B), SC_ZYYY},
+ {RUNE_C(0x00AB5C), RUNE_C(0x00AB64), SC_LATN},
+ {RUNE_C(0x00AB65), RUNE_C(0x00AB65), SC_GREK},
+ {RUNE_C(0x00AB66), RUNE_C(0x00AB69), SC_LATN},
+ {RUNE_C(0x00AB6A), RUNE_C(0x00AB6B), SC_ZYYY},
+ {RUNE_C(0x00AB70), RUNE_C(0x00ABBF), SC_CHER},
+ {RUNE_C(0x00ABC0), RUNE_C(0x00ABED), SC_MTEI},
+ {RUNE_C(0x00ABF0), RUNE_C(0x00ABF9), SC_MTEI},
+ {RUNE_C(0x00AC00), RUNE_C(0x00D7A3), SC_HANG},
+ {RUNE_C(0x00D7B0), RUNE_C(0x00D7C6), SC_HANG},
+ {RUNE_C(0x00D7CB), RUNE_C(0x00D7FB), SC_HANG},
+ {RUNE_C(0x00F900), RUNE_C(0x00FA6D), SC_HANI},
+ {RUNE_C(0x00FA70), RUNE_C(0x00FAD9), SC_HANI},
+ {RUNE_C(0x00FB00), RUNE_C(0x00FB06), SC_LATN},
+ {RUNE_C(0x00FB13), RUNE_C(0x00FB17), SC_ARMN},
+ {RUNE_C(0x00FB1D), RUNE_C(0x00FB36), SC_HEBR},
+ {RUNE_C(0x00FB38), RUNE_C(0x00FB3C), SC_HEBR},
+ {RUNE_C(0x00FB3E), RUNE_C(0x00FB3E), SC_HEBR},
+ {RUNE_C(0x00FB40), RUNE_C(0x00FB41), SC_HEBR},
+ {RUNE_C(0x00FB43), RUNE_C(0x00FB44), SC_HEBR},
+ {RUNE_C(0x00FB46), RUNE_C(0x00FB4F), SC_HEBR},
+ {RUNE_C(0x00FB50), RUNE_C(0x00FBC2), SC_ARAB},
+ {RUNE_C(0x00FBD3), RUNE_C(0x00FD3D), SC_ARAB},
+ {RUNE_C(0x00FD3E), RUNE_C(0x00FD3F), SC_ZYYY},
+ {RUNE_C(0x00FD40), RUNE_C(0x00FD8F), SC_ARAB},
+ {RUNE_C(0x00FD92), RUNE_C(0x00FDC7), SC_ARAB},
+ {RUNE_C(0x00FDCF), RUNE_C(0x00FDCF), SC_ARAB},
+ {RUNE_C(0x00FDF0), RUNE_C(0x00FDFF), SC_ARAB},
+ {RUNE_C(0x00FE00), RUNE_C(0x00FE0F), SC_ZINH},
+ {RUNE_C(0x00FE10), RUNE_C(0x00FE19), SC_ZYYY},
+ {RUNE_C(0x00FE20), RUNE_C(0x00FE2D), SC_ZINH},
+ {RUNE_C(0x00FE2E), RUNE_C(0x00FE2F), SC_CYRL},
+ {RUNE_C(0x00FE30), RUNE_C(0x00FE52), SC_ZYYY},
+ {RUNE_C(0x00FE54), RUNE_C(0x00FE66), SC_ZYYY},
+ {RUNE_C(0x00FE68), RUNE_C(0x00FE6B), SC_ZYYY},
+ {RUNE_C(0x00FE70), RUNE_C(0x00FE74), SC_ARAB},
+ {RUNE_C(0x00FE76), RUNE_C(0x00FEFC), SC_ARAB},
+ {RUNE_C(0x00FEFF), RUNE_C(0x00FEFF), SC_ZYYY},
+ {RUNE_C(0x00FF01), RUNE_C(0x00FF20), SC_ZYYY},
+ {RUNE_C(0x00FF21), RUNE_C(0x00FF3A), SC_LATN},
+ {RUNE_C(0x00FF3B), RUNE_C(0x00FF40), SC_ZYYY},
+ {RUNE_C(0x00FF41), RUNE_C(0x00FF5A), SC_LATN},
+ {RUNE_C(0x00FF5B), RUNE_C(0x00FF65), SC_ZYYY},
+ {RUNE_C(0x00FF66), RUNE_C(0x00FF6F), SC_KANA},
+ {RUNE_C(0x00FF70), RUNE_C(0x00FF70), SC_ZYYY},
+ {RUNE_C(0x00FF71), RUNE_C(0x00FF9D), SC_KANA},
+ {RUNE_C(0x00FF9E), RUNE_C(0x00FF9F), SC_ZYYY},
+ {RUNE_C(0x00FFA0), RUNE_C(0x00FFBE), SC_HANG},
+ {RUNE_C(0x00FFC2), RUNE_C(0x00FFC7), SC_HANG},
+ {RUNE_C(0x00FFCA), RUNE_C(0x00FFCF), SC_HANG},
+ {RUNE_C(0x00FFD2), RUNE_C(0x00FFD7), SC_HANG},
+ {RUNE_C(0x00FFDA), RUNE_C(0x00FFDC), SC_HANG},
+ {RUNE_C(0x00FFE0), RUNE_C(0x00FFE6), SC_ZYYY},
+ {RUNE_C(0x00FFE8), RUNE_C(0x00FFEE), SC_ZYYY},
+ {RUNE_C(0x00FFF9), RUNE_C(0x00FFFD), SC_ZYYY},
+ {RUNE_C(0x010000), RUNE_C(0x01000B), SC_LINB},
+ {RUNE_C(0x01000D), RUNE_C(0x010026), SC_LINB},
+ {RUNE_C(0x010028), RUNE_C(0x01003A), SC_LINB},
+ {RUNE_C(0x01003C), RUNE_C(0x01003D), SC_LINB},
+ {RUNE_C(0x01003F), RUNE_C(0x01004D), SC_LINB},
+ {RUNE_C(0x010050), RUNE_C(0x01005D), SC_LINB},
+ {RUNE_C(0x010080), RUNE_C(0x0100FA), SC_LINB},
+ {RUNE_C(0x010100), RUNE_C(0x010102), SC_ZYYY},
+ {RUNE_C(0x010107), RUNE_C(0x010133), SC_ZYYY},
+ {RUNE_C(0x010137), RUNE_C(0x01013F), SC_ZYYY},
+ {RUNE_C(0x010140), RUNE_C(0x01018E), SC_GREK},
+ {RUNE_C(0x010190), RUNE_C(0x01019C), SC_ZYYY},
+ {RUNE_C(0x0101A0), RUNE_C(0x0101A0), SC_GREK},
+ {RUNE_C(0x0101D0), RUNE_C(0x0101FC), SC_ZYYY},
+ {RUNE_C(0x0101FD), RUNE_C(0x0101FD), SC_ZINH},
+ {RUNE_C(0x010280), RUNE_C(0x01029C), SC_LYCI},
+ {RUNE_C(0x0102A0), RUNE_C(0x0102D0), SC_CARI},
+ {RUNE_C(0x0102E0), RUNE_C(0x0102E0), SC_ZINH},
+ {RUNE_C(0x0102E1), RUNE_C(0x0102FB), SC_ZYYY},
+ {RUNE_C(0x010300), RUNE_C(0x010323), SC_ITAL},
+ {RUNE_C(0x01032D), RUNE_C(0x01032F), SC_ITAL},
+ {RUNE_C(0x010330), RUNE_C(0x01034A), SC_GOTH},
+ {RUNE_C(0x010350), RUNE_C(0x01037A), SC_PERM},
+ {RUNE_C(0x010380), RUNE_C(0x01039D), SC_UGAR},
+ {RUNE_C(0x01039F), RUNE_C(0x01039F), SC_UGAR},
+ {RUNE_C(0x0103A0), RUNE_C(0x0103C3), SC_XPEO},
+ {RUNE_C(0x0103C8), RUNE_C(0x0103D5), SC_XPEO},
+ {RUNE_C(0x010400), RUNE_C(0x01044F), SC_DSRT},
+ {RUNE_C(0x010450), RUNE_C(0x01047F), SC_SHAW},
+ {RUNE_C(0x010480), RUNE_C(0x01049D), SC_OSMA},
+ {RUNE_C(0x0104A0), RUNE_C(0x0104A9), SC_OSMA},
+ {RUNE_C(0x0104B0), RUNE_C(0x0104D3), SC_OSGE},
+ {RUNE_C(0x0104D8), RUNE_C(0x0104FB), SC_OSGE},
+ {RUNE_C(0x010500), RUNE_C(0x010527), SC_ELBA},
+ {RUNE_C(0x010530), RUNE_C(0x010563), SC_AGHB},
+ {RUNE_C(0x01056F), RUNE_C(0x01056F), SC_AGHB},
+ {RUNE_C(0x010570), RUNE_C(0x01057A), SC_VITH},
+ {RUNE_C(0x01057C), RUNE_C(0x01058A), SC_VITH},
+ {RUNE_C(0x01058C), RUNE_C(0x010592), SC_VITH},
+ {RUNE_C(0x010594), RUNE_C(0x010595), SC_VITH},
+ {RUNE_C(0x010597), RUNE_C(0x0105A1), SC_VITH},
+ {RUNE_C(0x0105A3), RUNE_C(0x0105B1), SC_VITH},
+ {RUNE_C(0x0105B3), RUNE_C(0x0105B9), SC_VITH},
+ {RUNE_C(0x0105BB), RUNE_C(0x0105BC), SC_VITH},
+ {RUNE_C(0x010600), RUNE_C(0x010736), SC_LINA},
+ {RUNE_C(0x010740), RUNE_C(0x010755), SC_LINA},
+ {RUNE_C(0x010760), RUNE_C(0x010767), SC_LINA},
+ {RUNE_C(0x010780), RUNE_C(0x010785), SC_LATN},
+ {RUNE_C(0x010787), RUNE_C(0x0107B0), SC_LATN},
+ {RUNE_C(0x0107B2), RUNE_C(0x0107BA), SC_LATN},
+ {RUNE_C(0x010800), RUNE_C(0x010805), SC_CPRT},
+ {RUNE_C(0x010808), RUNE_C(0x010808), SC_CPRT},
+ {RUNE_C(0x01080A), RUNE_C(0x010835), SC_CPRT},
+ {RUNE_C(0x010837), RUNE_C(0x010838), SC_CPRT},
+ {RUNE_C(0x01083C), RUNE_C(0x01083C), SC_CPRT},
+ {RUNE_C(0x01083F), RUNE_C(0x01083F), SC_CPRT},
+ {RUNE_C(0x010840), RUNE_C(0x010855), SC_ARMI},
+ {RUNE_C(0x010857), RUNE_C(0x01085F), SC_ARMI},
+ {RUNE_C(0x010860), RUNE_C(0x01087F), SC_PALM},
+ {RUNE_C(0x010880), RUNE_C(0x01089E), SC_NBAT},
+ {RUNE_C(0x0108A7), RUNE_C(0x0108AF), SC_NBAT},
+ {RUNE_C(0x0108E0), RUNE_C(0x0108F2), SC_HATR},
+ {RUNE_C(0x0108F4), RUNE_C(0x0108F5), SC_HATR},
+ {RUNE_C(0x0108FB), RUNE_C(0x0108FF), SC_HATR},
+ {RUNE_C(0x010900), RUNE_C(0x01091B), SC_PHNX},
+ {RUNE_C(0x01091F), RUNE_C(0x01091F), SC_PHNX},
+ {RUNE_C(0x010920), RUNE_C(0x010939), SC_LYDI},
+ {RUNE_C(0x01093F), RUNE_C(0x01093F), SC_LYDI},
+ {RUNE_C(0x010980), RUNE_C(0x01099F), SC_MERO},
+ {RUNE_C(0x0109A0), RUNE_C(0x0109B7), SC_MERC},
+ {RUNE_C(0x0109BC), RUNE_C(0x0109CF), SC_MERC},
+ {RUNE_C(0x0109D2), RUNE_C(0x0109FF), SC_MERC},
+ {RUNE_C(0x010A00), RUNE_C(0x010A03), SC_KHAR},
+ {RUNE_C(0x010A05), RUNE_C(0x010A06), SC_KHAR},
+ {RUNE_C(0x010A0C), RUNE_C(0x010A13), SC_KHAR},
+ {RUNE_C(0x010A15), RUNE_C(0x010A17), SC_KHAR},
+ {RUNE_C(0x010A19), RUNE_C(0x010A35), SC_KHAR},
+ {RUNE_C(0x010A38), RUNE_C(0x010A3A), SC_KHAR},
+ {RUNE_C(0x010A3F), RUNE_C(0x010A48), SC_KHAR},
+ {RUNE_C(0x010A50), RUNE_C(0x010A58), SC_KHAR},
+ {RUNE_C(0x010A60), RUNE_C(0x010A7F), SC_SARB},
+ {RUNE_C(0x010A80), RUNE_C(0x010A9F), SC_NARB},
+ {RUNE_C(0x010AC0), RUNE_C(0x010AE6), SC_MANI},
+ {RUNE_C(0x010AEB), RUNE_C(0x010AF6), SC_MANI},
+ {RUNE_C(0x010B00), RUNE_C(0x010B35), SC_AVST},
+ {RUNE_C(0x010B39), RUNE_C(0x010B3F), SC_AVST},
+ {RUNE_C(0x010B40), RUNE_C(0x010B55), SC_PRTI},
+ {RUNE_C(0x010B58), RUNE_C(0x010B5F), SC_PRTI},
+ {RUNE_C(0x010B60), RUNE_C(0x010B72), SC_PHLI},
+ {RUNE_C(0x010B78), RUNE_C(0x010B7F), SC_PHLI},
+ {RUNE_C(0x010B80), RUNE_C(0x010B91), SC_PHLP},
+ {RUNE_C(0x010B99), RUNE_C(0x010B9C), SC_PHLP},
+ {RUNE_C(0x010BA9), RUNE_C(0x010BAF), SC_PHLP},
+ {RUNE_C(0x010C00), RUNE_C(0x010C48), SC_ORKH},
+ {RUNE_C(0x010C80), RUNE_C(0x010CB2), SC_HUNG},
+ {RUNE_C(0x010CC0), RUNE_C(0x010CF2), SC_HUNG},
+ {RUNE_C(0x010CFA), RUNE_C(0x010CFF), SC_HUNG},
+ {RUNE_C(0x010D00), RUNE_C(0x010D27), SC_ROHG},
+ {RUNE_C(0x010D30), RUNE_C(0x010D39), SC_ROHG},
+ {RUNE_C(0x010E60), RUNE_C(0x010E7E), SC_ARAB},
+ {RUNE_C(0x010E80), RUNE_C(0x010EA9), SC_YEZI},
+ {RUNE_C(0x010EAB), RUNE_C(0x010EAD), SC_YEZI},
+ {RUNE_C(0x010EB0), RUNE_C(0x010EB1), SC_YEZI},
+ {RUNE_C(0x010EFD), RUNE_C(0x010EFF), SC_ARAB},
+ {RUNE_C(0x010F00), RUNE_C(0x010F27), SC_SOGO},
+ {RUNE_C(0x010F30), RUNE_C(0x010F59), SC_SOGD},
+ {RUNE_C(0x010F70), RUNE_C(0x010F89), SC_OUGR},
+ {RUNE_C(0x010FB0), RUNE_C(0x010FCB), SC_CHRS},
+ {RUNE_C(0x010FE0), RUNE_C(0x010FF6), SC_ELYM},
+ {RUNE_C(0x011000), RUNE_C(0x01104D), SC_BRAH},
+ {RUNE_C(0x011052), RUNE_C(0x011075), SC_BRAH},
+ {RUNE_C(0x01107F), RUNE_C(0x01107F), SC_BRAH},
+ {RUNE_C(0x011080), RUNE_C(0x0110C2), SC_KTHI},
+ {RUNE_C(0x0110CD), RUNE_C(0x0110CD), SC_KTHI},
+ {RUNE_C(0x0110D0), RUNE_C(0x0110E8), SC_SORA},
+ {RUNE_C(0x0110F0), RUNE_C(0x0110F9), SC_SORA},
+ {RUNE_C(0x011100), RUNE_C(0x011134), SC_CAKM},
+ {RUNE_C(0x011136), RUNE_C(0x011147), SC_CAKM},
+ {RUNE_C(0x011150), RUNE_C(0x011176), SC_MAHJ},
+ {RUNE_C(0x011180), RUNE_C(0x0111DF), SC_SHRD},
+ {RUNE_C(0x0111E1), RUNE_C(0x0111F4), SC_SINH},
+ {RUNE_C(0x011200), RUNE_C(0x011211), SC_KHOJ},
+ {RUNE_C(0x011213), RUNE_C(0x011241), SC_KHOJ},
+ {RUNE_C(0x011280), RUNE_C(0x011286), SC_MULT},
+ {RUNE_C(0x011288), RUNE_C(0x011288), SC_MULT},
+ {RUNE_C(0x01128A), RUNE_C(0x01128D), SC_MULT},
+ {RUNE_C(0x01128F), RUNE_C(0x01129D), SC_MULT},
+ {RUNE_C(0x01129F), RUNE_C(0x0112A9), SC_MULT},
+ {RUNE_C(0x0112B0), RUNE_C(0x0112EA), SC_SIND},
+ {RUNE_C(0x0112F0), RUNE_C(0x0112F9), SC_SIND},
+ {RUNE_C(0x011300), RUNE_C(0x011303), SC_GRAN},
+ {RUNE_C(0x011305), RUNE_C(0x01130C), SC_GRAN},
+ {RUNE_C(0x01130F), RUNE_C(0x011310), SC_GRAN},
+ {RUNE_C(0x011313), RUNE_C(0x011328), SC_GRAN},
+ {RUNE_C(0x01132A), RUNE_C(0x011330), SC_GRAN},
+ {RUNE_C(0x011332), RUNE_C(0x011333), SC_GRAN},
+ {RUNE_C(0x011335), RUNE_C(0x011339), SC_GRAN},
+ {RUNE_C(0x01133B), RUNE_C(0x01133B), SC_ZINH},
+ {RUNE_C(0x01133C), RUNE_C(0x011344), SC_GRAN},
+ {RUNE_C(0x011347), RUNE_C(0x011348), SC_GRAN},
+ {RUNE_C(0x01134B), RUNE_C(0x01134D), SC_GRAN},
+ {RUNE_C(0x011350), RUNE_C(0x011350), SC_GRAN},
+ {RUNE_C(0x011357), RUNE_C(0x011357), SC_GRAN},
+ {RUNE_C(0x01135D), RUNE_C(0x011363), SC_GRAN},
+ {RUNE_C(0x011366), RUNE_C(0x01136C), SC_GRAN},
+ {RUNE_C(0x011370), RUNE_C(0x011374), SC_GRAN},
+ {RUNE_C(0x011400), RUNE_C(0x01145B), SC_NEWA},
+ {RUNE_C(0x01145D), RUNE_C(0x011461), SC_NEWA},
+ {RUNE_C(0x011480), RUNE_C(0x0114C7), SC_TIRH},
+ {RUNE_C(0x0114D0), RUNE_C(0x0114D9), SC_TIRH},
+ {RUNE_C(0x011580), RUNE_C(0x0115B5), SC_SIDD},
+ {RUNE_C(0x0115B8), RUNE_C(0x0115DD), SC_SIDD},
+ {RUNE_C(0x011600), RUNE_C(0x011644), SC_MODI},
+ {RUNE_C(0x011650), RUNE_C(0x011659), SC_MODI},
+ {RUNE_C(0x011660), RUNE_C(0x01166C), SC_MONG},
+ {RUNE_C(0x011680), RUNE_C(0x0116B9), SC_TAKR},
+ {RUNE_C(0x0116C0), RUNE_C(0x0116C9), SC_TAKR},
+ {RUNE_C(0x011700), RUNE_C(0x01171A), SC_AHOM},
+ {RUNE_C(0x01171D), RUNE_C(0x01172B), SC_AHOM},
+ {RUNE_C(0x011730), RUNE_C(0x011746), SC_AHOM},
+ {RUNE_C(0x011800), RUNE_C(0x01183B), SC_DOGR},
+ {RUNE_C(0x0118A0), RUNE_C(0x0118F2), SC_WARA},
+ {RUNE_C(0x0118FF), RUNE_C(0x0118FF), SC_WARA},
+ {RUNE_C(0x011900), RUNE_C(0x011906), SC_DIAK},
+ {RUNE_C(0x011909), RUNE_C(0x011909), SC_DIAK},
+ {RUNE_C(0x01190C), RUNE_C(0x011913), SC_DIAK},
+ {RUNE_C(0x011915), RUNE_C(0x011916), SC_DIAK},
+ {RUNE_C(0x011918), RUNE_C(0x011935), SC_DIAK},
+ {RUNE_C(0x011937), RUNE_C(0x011938), SC_DIAK},
+ {RUNE_C(0x01193B), RUNE_C(0x011946), SC_DIAK},
+ {RUNE_C(0x011950), RUNE_C(0x011959), SC_DIAK},
+ {RUNE_C(0x0119A0), RUNE_C(0x0119A7), SC_NAND},
+ {RUNE_C(0x0119AA), RUNE_C(0x0119D7), SC_NAND},
+ {RUNE_C(0x0119DA), RUNE_C(0x0119E4), SC_NAND},
+ {RUNE_C(0x011A00), RUNE_C(0x011A47), SC_ZANB},
+ {RUNE_C(0x011A50), RUNE_C(0x011AA2), SC_SOYO},
+ {RUNE_C(0x011AB0), RUNE_C(0x011ABF), SC_CANS},
+ {RUNE_C(0x011AC0), RUNE_C(0x011AF8), SC_PAUC},
+ {RUNE_C(0x011B00), RUNE_C(0x011B09), SC_DEVA},
+ {RUNE_C(0x011C00), RUNE_C(0x011C08), SC_BHKS},
+ {RUNE_C(0x011C0A), RUNE_C(0x011C36), SC_BHKS},
+ {RUNE_C(0x011C38), RUNE_C(0x011C45), SC_BHKS},
+ {RUNE_C(0x011C50), RUNE_C(0x011C6C), SC_BHKS},
+ {RUNE_C(0x011C70), RUNE_C(0x011C8F), SC_MARC},
+ {RUNE_C(0x011C92), RUNE_C(0x011CA7), SC_MARC},
+ {RUNE_C(0x011CA9), RUNE_C(0x011CB6), SC_MARC},
+ {RUNE_C(0x011D00), RUNE_C(0x011D06), SC_GONM},
+ {RUNE_C(0x011D08), RUNE_C(0x011D09), SC_GONM},
+ {RUNE_C(0x011D0B), RUNE_C(0x011D36), SC_GONM},
+ {RUNE_C(0x011D3A), RUNE_C(0x011D3A), SC_GONM},
+ {RUNE_C(0x011D3C), RUNE_C(0x011D3D), SC_GONM},
+ {RUNE_C(0x011D3F), RUNE_C(0x011D47), SC_GONM},
+ {RUNE_C(0x011D50), RUNE_C(0x011D59), SC_GONM},
+ {RUNE_C(0x011D60), RUNE_C(0x011D65), SC_GONG},
+ {RUNE_C(0x011D67), RUNE_C(0x011D68), SC_GONG},
+ {RUNE_C(0x011D6A), RUNE_C(0x011D8E), SC_GONG},
+ {RUNE_C(0x011D90), RUNE_C(0x011D91), SC_GONG},
+ {RUNE_C(0x011D93), RUNE_C(0x011D98), SC_GONG},
+ {RUNE_C(0x011DA0), RUNE_C(0x011DA9), SC_GONG},
+ {RUNE_C(0x011EE0), RUNE_C(0x011EF8), SC_MAKA},
+ {RUNE_C(0x011F00), RUNE_C(0x011F10), SC_KAWI},
+ {RUNE_C(0x011F12), RUNE_C(0x011F3A), SC_KAWI},
+ {RUNE_C(0x011F3E), RUNE_C(0x011F59), SC_KAWI},
+ {RUNE_C(0x011FB0), RUNE_C(0x011FB0), SC_LISU},
+ {RUNE_C(0x011FC0), RUNE_C(0x011FF1), SC_TAML},
+ {RUNE_C(0x011FFF), RUNE_C(0x011FFF), SC_TAML},
+ {RUNE_C(0x012000), RUNE_C(0x012399), SC_XSUX},
+ {RUNE_C(0x012400), RUNE_C(0x01246E), SC_XSUX},
+ {RUNE_C(0x012470), RUNE_C(0x012474), SC_XSUX},
+ {RUNE_C(0x012480), RUNE_C(0x012543), SC_XSUX},
+ {RUNE_C(0x012F90), RUNE_C(0x012FF2), SC_CPMN},
+ {RUNE_C(0x013000), RUNE_C(0x013455), SC_EGYP},
+ {RUNE_C(0x014400), RUNE_C(0x014646), SC_HLUW},
+ {RUNE_C(0x016800), RUNE_C(0x016A38), SC_BAMU},
+ {RUNE_C(0x016A40), RUNE_C(0x016A5E), SC_MROO},
+ {RUNE_C(0x016A60), RUNE_C(0x016A69), SC_MROO},
+ {RUNE_C(0x016A6E), RUNE_C(0x016A6F), SC_MROO},
+ {RUNE_C(0x016A70), RUNE_C(0x016ABE), SC_TNSA},
+ {RUNE_C(0x016AC0), RUNE_C(0x016AC9), SC_TNSA},
+ {RUNE_C(0x016AD0), RUNE_C(0x016AED), SC_BASS},
+ {RUNE_C(0x016AF0), RUNE_C(0x016AF5), SC_BASS},
+ {RUNE_C(0x016B00), RUNE_C(0x016B45), SC_HMNG},
+ {RUNE_C(0x016B50), RUNE_C(0x016B59), SC_HMNG},
+ {RUNE_C(0x016B5B), RUNE_C(0x016B61), SC_HMNG},
+ {RUNE_C(0x016B63), RUNE_C(0x016B77), SC_HMNG},
+ {RUNE_C(0x016B7D), RUNE_C(0x016B8F), SC_HMNG},
+ {RUNE_C(0x016E40), RUNE_C(0x016E9A), SC_MEDF},
+ {RUNE_C(0x016F00), RUNE_C(0x016F4A), SC_PLRD},
+ {RUNE_C(0x016F4F), RUNE_C(0x016F87), SC_PLRD},
+ {RUNE_C(0x016F8F), RUNE_C(0x016F9F), SC_PLRD},
+ {RUNE_C(0x016FE0), RUNE_C(0x016FE0), SC_TANG},
+ {RUNE_C(0x016FE1), RUNE_C(0x016FE1), SC_NSHU},
+ {RUNE_C(0x016FE2), RUNE_C(0x016FE3), SC_HANI},
+ {RUNE_C(0x016FE4), RUNE_C(0x016FE4), SC_KITS},
+ {RUNE_C(0x016FF0), RUNE_C(0x016FF1), SC_HANI},
+ {RUNE_C(0x017000), RUNE_C(0x0187F7), SC_TANG},
+ {RUNE_C(0x018800), RUNE_C(0x018AFF), SC_TANG},
+ {RUNE_C(0x018B00), RUNE_C(0x018CD5), SC_KITS},
+ {RUNE_C(0x018D00), RUNE_C(0x018D08), SC_TANG},
+ {RUNE_C(0x01AFF0), RUNE_C(0x01AFF3), SC_KANA},
+ {RUNE_C(0x01AFF5), RUNE_C(0x01AFFB), SC_KANA},
+ {RUNE_C(0x01AFFD), RUNE_C(0x01AFFE), SC_KANA},
+ {RUNE_C(0x01B000), RUNE_C(0x01B000), SC_KANA},
+ {RUNE_C(0x01B001), RUNE_C(0x01B11F), SC_HIRA},
+ {RUNE_C(0x01B120), RUNE_C(0x01B122), SC_KANA},
+ {RUNE_C(0x01B132), RUNE_C(0x01B132), SC_HIRA},
+ {RUNE_C(0x01B150), RUNE_C(0x01B152), SC_HIRA},
+ {RUNE_C(0x01B155), RUNE_C(0x01B155), SC_KANA},
+ {RUNE_C(0x01B164), RUNE_C(0x01B167), SC_KANA},
+ {RUNE_C(0x01B170), RUNE_C(0x01B2FB), SC_NSHU},
+ {RUNE_C(0x01BC00), RUNE_C(0x01BC6A), SC_DUPL},
+ {RUNE_C(0x01BC70), RUNE_C(0x01BC7C), SC_DUPL},
+ {RUNE_C(0x01BC80), RUNE_C(0x01BC88), SC_DUPL},
+ {RUNE_C(0x01BC90), RUNE_C(0x01BC99), SC_DUPL},
+ {RUNE_C(0x01BC9C), RUNE_C(0x01BC9F), SC_DUPL},
+ {RUNE_C(0x01BCA0), RUNE_C(0x01BCA3), SC_ZYYY},
+ {RUNE_C(0x01CF00), RUNE_C(0x01CF2D), SC_ZINH},
+ {RUNE_C(0x01CF30), RUNE_C(0x01CF46), SC_ZINH},
+ {RUNE_C(0x01CF50), RUNE_C(0x01CFC3), SC_ZYYY},
+ {RUNE_C(0x01D000), RUNE_C(0x01D0F5), SC_ZYYY},
+ {RUNE_C(0x01D100), RUNE_C(0x01D126), SC_ZYYY},
+ {RUNE_C(0x01D129), RUNE_C(0x01D166), SC_ZYYY},
+ {RUNE_C(0x01D167), RUNE_C(0x01D169), SC_ZINH},
+ {RUNE_C(0x01D16A), RUNE_C(0x01D17A), SC_ZYYY},
+ {RUNE_C(0x01D17B), RUNE_C(0x01D182), SC_ZINH},
+ {RUNE_C(0x01D183), RUNE_C(0x01D184), SC_ZYYY},
+ {RUNE_C(0x01D185), RUNE_C(0x01D18B), SC_ZINH},
+ {RUNE_C(0x01D18C), RUNE_C(0x01D1A9), SC_ZYYY},
+ {RUNE_C(0x01D1AA), RUNE_C(0x01D1AD), SC_ZINH},
+ {RUNE_C(0x01D1AE), RUNE_C(0x01D1EA), SC_ZYYY},
+ {RUNE_C(0x01D200), RUNE_C(0x01D245), SC_GREK},
+ {RUNE_C(0x01D2C0), RUNE_C(0x01D2D3), SC_ZYYY},
+ {RUNE_C(0x01D2E0), RUNE_C(0x01D2F3), SC_ZYYY},
+ {RUNE_C(0x01D300), RUNE_C(0x01D356), SC_ZYYY},
+ {RUNE_C(0x01D360), RUNE_C(0x01D378), SC_ZYYY},
+ {RUNE_C(0x01D400), RUNE_C(0x01D454), SC_ZYYY},
+ {RUNE_C(0x01D456), RUNE_C(0x01D49C), SC_ZYYY},
+ {RUNE_C(0x01D49E), RUNE_C(0x01D49F), SC_ZYYY},
+ {RUNE_C(0x01D4A2), RUNE_C(0x01D4A2), SC_ZYYY},
+ {RUNE_C(0x01D4A5), RUNE_C(0x01D4A6), SC_ZYYY},
+ {RUNE_C(0x01D4A9), RUNE_C(0x01D4AC), SC_ZYYY},
+ {RUNE_C(0x01D4AE), RUNE_C(0x01D4B9), SC_ZYYY},
+ {RUNE_C(0x01D4BB), RUNE_C(0x01D4BB), SC_ZYYY},
+ {RUNE_C(0x01D4BD), RUNE_C(0x01D4C3), SC_ZYYY},
+ {RUNE_C(0x01D4C5), RUNE_C(0x01D505), SC_ZYYY},
+ {RUNE_C(0x01D507), RUNE_C(0x01D50A), SC_ZYYY},
+ {RUNE_C(0x01D50D), RUNE_C(0x01D514), SC_ZYYY},
+ {RUNE_C(0x01D516), RUNE_C(0x01D51C), SC_ZYYY},
+ {RUNE_C(0x01D51E), RUNE_C(0x01D539), SC_ZYYY},
+ {RUNE_C(0x01D53B), RUNE_C(0x01D53E), SC_ZYYY},
+ {RUNE_C(0x01D540), RUNE_C(0x01D544), SC_ZYYY},
+ {RUNE_C(0x01D546), RUNE_C(0x01D546), SC_ZYYY},
+ {RUNE_C(0x01D54A), RUNE_C(0x01D550), SC_ZYYY},
+ {RUNE_C(0x01D552), RUNE_C(0x01D6A5), SC_ZYYY},
+ {RUNE_C(0x01D6A8), RUNE_C(0x01D7CB), SC_ZYYY},
+ {RUNE_C(0x01D7CE), RUNE_C(0x01D7FF), SC_ZYYY},
+ {RUNE_C(0x01D800), RUNE_C(0x01DA8B), SC_SGNW},
+ {RUNE_C(0x01DA9B), RUNE_C(0x01DA9F), SC_SGNW},
+ {RUNE_C(0x01DAA1), RUNE_C(0x01DAAF), SC_SGNW},
+ {RUNE_C(0x01DF00), RUNE_C(0x01DF1E), SC_LATN},
+ {RUNE_C(0x01DF25), RUNE_C(0x01DF2A), SC_LATN},
+ {RUNE_C(0x01E000), RUNE_C(0x01E006), SC_GLAG},
+ {RUNE_C(0x01E008), RUNE_C(0x01E018), SC_GLAG},
+ {RUNE_C(0x01E01B), RUNE_C(0x01E021), SC_GLAG},
+ {RUNE_C(0x01E023), RUNE_C(0x01E024), SC_GLAG},
+ {RUNE_C(0x01E026), RUNE_C(0x01E02A), SC_GLAG},
+ {RUNE_C(0x01E030), RUNE_C(0x01E06D), SC_CYRL},
+ {RUNE_C(0x01E08F), RUNE_C(0x01E08F), SC_CYRL},
+ {RUNE_C(0x01E100), RUNE_C(0x01E12C), SC_HMNP},
+ {RUNE_C(0x01E130), RUNE_C(0x01E13D), SC_HMNP},
+ {RUNE_C(0x01E140), RUNE_C(0x01E149), SC_HMNP},
+ {RUNE_C(0x01E14E), RUNE_C(0x01E14F), SC_HMNP},
+ {RUNE_C(0x01E290), RUNE_C(0x01E2AE), SC_TOTO},
+ {RUNE_C(0x01E2C0), RUNE_C(0x01E2F9), SC_WCHO},
+ {RUNE_C(0x01E2FF), RUNE_C(0x01E2FF), SC_WCHO},
+ {RUNE_C(0x01E4D0), RUNE_C(0x01E4F9), SC_NAGM},
+ {RUNE_C(0x01E7E0), RUNE_C(0x01E7E6), SC_ETHI},
+ {RUNE_C(0x01E7E8), RUNE_C(0x01E7EB), SC_ETHI},
+ {RUNE_C(0x01E7ED), RUNE_C(0x01E7EE), SC_ETHI},
+ {RUNE_C(0x01E7F0), RUNE_C(0x01E7FE), SC_ETHI},
+ {RUNE_C(0x01E800), RUNE_C(0x01E8C4), SC_MEND},
+ {RUNE_C(0x01E8C7), RUNE_C(0x01E8D6), SC_MEND},
+ {RUNE_C(0x01E900), RUNE_C(0x01E94B), SC_ADLM},
+ {RUNE_C(0x01E950), RUNE_C(0x01E959), SC_ADLM},
+ {RUNE_C(0x01E95E), RUNE_C(0x01E95F), SC_ADLM},
+ {RUNE_C(0x01EC71), RUNE_C(0x01ECB4), SC_ZYYY},
+ {RUNE_C(0x01ED01), RUNE_C(0x01ED3D), SC_ZYYY},
+ {RUNE_C(0x01EE00), RUNE_C(0x01EE03), SC_ARAB},
+ {RUNE_C(0x01EE05), RUNE_C(0x01EE1F), SC_ARAB},
+ {RUNE_C(0x01EE21), RUNE_C(0x01EE22), SC_ARAB},
+ {RUNE_C(0x01EE24), RUNE_C(0x01EE24), SC_ARAB},
+ {RUNE_C(0x01EE27), RUNE_C(0x01EE27), SC_ARAB},
+ {RUNE_C(0x01EE29), RUNE_C(0x01EE32), SC_ARAB},
+ {RUNE_C(0x01EE34), RUNE_C(0x01EE37), SC_ARAB},
+ {RUNE_C(0x01EE39), RUNE_C(0x01EE39), SC_ARAB},
+ {RUNE_C(0x01EE3B), RUNE_C(0x01EE3B), SC_ARAB},
+ {RUNE_C(0x01EE42), RUNE_C(0x01EE42), SC_ARAB},
+ {RUNE_C(0x01EE47), RUNE_C(0x01EE47), SC_ARAB},
+ {RUNE_C(0x01EE49), RUNE_C(0x01EE49), SC_ARAB},
+ {RUNE_C(0x01EE4B), RUNE_C(0x01EE4B), SC_ARAB},
+ {RUNE_C(0x01EE4D), RUNE_C(0x01EE4F), SC_ARAB},
+ {RUNE_C(0x01EE51), RUNE_C(0x01EE52), SC_ARAB},
+ {RUNE_C(0x01EE54), RUNE_C(0x01EE54), SC_ARAB},
+ {RUNE_C(0x01EE57), RUNE_C(0x01EE57), SC_ARAB},
+ {RUNE_C(0x01EE59), RUNE_C(0x01EE59), SC_ARAB},
+ {RUNE_C(0x01EE5B), RUNE_C(0x01EE5B), SC_ARAB},
+ {RUNE_C(0x01EE5D), RUNE_C(0x01EE5D), SC_ARAB},
+ {RUNE_C(0x01EE5F), RUNE_C(0x01EE5F), SC_ARAB},
+ {RUNE_C(0x01EE61), RUNE_C(0x01EE62), SC_ARAB},
+ {RUNE_C(0x01EE64), RUNE_C(0x01EE64), SC_ARAB},
+ {RUNE_C(0x01EE67), RUNE_C(0x01EE6A), SC_ARAB},
+ {RUNE_C(0x01EE6C), RUNE_C(0x01EE72), SC_ARAB},
+ {RUNE_C(0x01EE74), RUNE_C(0x01EE77), SC_ARAB},
+ {RUNE_C(0x01EE79), RUNE_C(0x01EE7C), SC_ARAB},
+ {RUNE_C(0x01EE7E), RUNE_C(0x01EE7E), SC_ARAB},
+ {RUNE_C(0x01EE80), RUNE_C(0x01EE89), SC_ARAB},
+ {RUNE_C(0x01EE8B), RUNE_C(0x01EE9B), SC_ARAB},
+ {RUNE_C(0x01EEA1), RUNE_C(0x01EEA3), SC_ARAB},
+ {RUNE_C(0x01EEA5), RUNE_C(0x01EEA9), SC_ARAB},
+ {RUNE_C(0x01EEAB), RUNE_C(0x01EEBB), SC_ARAB},
+ {RUNE_C(0x01EEF0), RUNE_C(0x01EEF1), SC_ARAB},
+ {RUNE_C(0x01F000), RUNE_C(0x01F02B), SC_ZYYY},
+ {RUNE_C(0x01F030), RUNE_C(0x01F093), SC_ZYYY},
+ {RUNE_C(0x01F0A0), RUNE_C(0x01F0AE), SC_ZYYY},
+ {RUNE_C(0x01F0B1), RUNE_C(0x01F0BF), SC_ZYYY},
+ {RUNE_C(0x01F0C1), RUNE_C(0x01F0CF), SC_ZYYY},
+ {RUNE_C(0x01F0D1), RUNE_C(0x01F0F5), SC_ZYYY},
+ {RUNE_C(0x01F100), RUNE_C(0x01F1AD), SC_ZYYY},
+ {RUNE_C(0x01F1E6), RUNE_C(0x01F1FF), SC_ZYYY},
+ {RUNE_C(0x01F200), RUNE_C(0x01F200), SC_HIRA},
+ {RUNE_C(0x01F201), RUNE_C(0x01F202), SC_ZYYY},
+ {RUNE_C(0x01F210), RUNE_C(0x01F23B), SC_ZYYY},
+ {RUNE_C(0x01F240), RUNE_C(0x01F248), SC_ZYYY},
+ {RUNE_C(0x01F250), RUNE_C(0x01F251), SC_ZYYY},
+ {RUNE_C(0x01F260), RUNE_C(0x01F265), SC_ZYYY},
+ {RUNE_C(0x01F300), RUNE_C(0x01F6D7), SC_ZYYY},
+ {RUNE_C(0x01F6DC), RUNE_C(0x01F6EC), SC_ZYYY},
+ {RUNE_C(0x01F6F0), RUNE_C(0x01F6FC), SC_ZYYY},
+ {RUNE_C(0x01F700), RUNE_C(0x01F776), SC_ZYYY},
+ {RUNE_C(0x01F77B), RUNE_C(0x01F7D9), SC_ZYYY},
+ {RUNE_C(0x01F7E0), RUNE_C(0x01F7EB), SC_ZYYY},
+ {RUNE_C(0x01F7F0), RUNE_C(0x01F7F0), SC_ZYYY},
+ {RUNE_C(0x01F800), RUNE_C(0x01F80B), SC_ZYYY},
+ {RUNE_C(0x01F810), RUNE_C(0x01F847), SC_ZYYY},
+ {RUNE_C(0x01F850), RUNE_C(0x01F859), SC_ZYYY},
+ {RUNE_C(0x01F860), RUNE_C(0x01F887), SC_ZYYY},
+ {RUNE_C(0x01F890), RUNE_C(0x01F8AD), SC_ZYYY},
+ {RUNE_C(0x01F8B0), RUNE_C(0x01F8B1), SC_ZYYY},
+ {RUNE_C(0x01F900), RUNE_C(0x01FA53), SC_ZYYY},
+ {RUNE_C(0x01FA60), RUNE_C(0x01FA6D), SC_ZYYY},
+ {RUNE_C(0x01FA70), RUNE_C(0x01FA7C), SC_ZYYY},
+ {RUNE_C(0x01FA80), RUNE_C(0x01FA88), SC_ZYYY},
+ {RUNE_C(0x01FA90), RUNE_C(0x01FABD), SC_ZYYY},
+ {RUNE_C(0x01FABF), RUNE_C(0x01FAC5), SC_ZYYY},
+ {RUNE_C(0x01FACE), RUNE_C(0x01FADB), SC_ZYYY},
+ {RUNE_C(0x01FAE0), RUNE_C(0x01FAE8), SC_ZYYY},
+ {RUNE_C(0x01FAF0), RUNE_C(0x01FAF8), SC_ZYYY},
+ {RUNE_C(0x01FB00), RUNE_C(0x01FB92), SC_ZYYY},
+ {RUNE_C(0x01FB94), RUNE_C(0x01FBCA), SC_ZYYY},
+ {RUNE_C(0x01FBF0), RUNE_C(0x01FBF9), SC_ZYYY},
+ {RUNE_C(0x020000), RUNE_C(0x02A6DF), SC_HANI},
+ {RUNE_C(0x02A700), RUNE_C(0x02B739), SC_HANI},
+ {RUNE_C(0x02B740), RUNE_C(0x02B81D), SC_HANI},
+ {RUNE_C(0x02B820), RUNE_C(0x02CEA1), SC_HANI},
+ {RUNE_C(0x02CEB0), RUNE_C(0x02EBE0), SC_HANI},
+ {RUNE_C(0x02EBF0), RUNE_C(0x02EE5D), SC_HANI},
+ {RUNE_C(0x02F800), RUNE_C(0x02FA1D), SC_HANI},
+ {RUNE_C(0x030000), RUNE_C(0x03134A), SC_HANI},
+ {RUNE_C(0x031350), RUNE_C(0x0323AF), SC_HANI},
+ {RUNE_C(0x0E0001), RUNE_C(0x0E0001), SC_ZYYY},
+ {RUNE_C(0x0E0020), RUNE_C(0x0E007F), SC_ZYYY},
+ {RUNE_C(0x0E0100), RUNE_C(0x0E01EF), SC_ZINH},
+};
+
+/* Instantiate the search helper used for code points that are not served by
+   the direct-index table.  NOTE(review): presumably this expands to the
+   definition of mlib_lookup(), a binary search over the sorted ‘lookup’
+   range table that yields SC_ZZZZ (Unknown) when no range contains the
+   code point — confirm against the macro definition. */
+__MLIB_DEFINE_BSEARCH(enum uprop_sc, lookup, SC_ZZZZ)
+
+/* Return the Script property value of the code point CH.
+
+   Code points that are valid indices into lookup_lat1 are answered by a
+   direct table read; every other code point is resolved by mlib_lookup(). */
+enum uprop_sc
+uprop_get_sc(rune ch)
+{
+ /* The comparison must be strict: lengthof(lookup_lat1) is one past the
+    last valid index, so ‘<=’ would read beyond the end of the array. */
+ return ch < lengthof(lookup_lat1) ? lookup_lat1[ch] : mlib_lookup(ch);
+}