// Gist bhamiltoncx/7a2d9f31cedf2647f084d907787a07db, created February 17, 2017 18:47.
// Unicode code point classifier using new ANTLR4 full Unicode syntax.
// Note: this file contains hidden or bidirectional Unicode text that may be
// interpreted or compiled differently than it appears. To review, open the file
// in an editor that reveals hidden Unicode characters.
/** classify21.g4
 *
 *  Automatically generated Unicode 9.0.0 codepoint classification grammar.
 *  Generated by "makeGrammars.py".
 *
 *  Author:  Jonathan D. Lettvin ([email protected])
 *  Date:    20161023
 *  Legal:   Copyright(c) Jonathan D. Lettvin, All Rights Reserved
 *  License: GPL 3.0
 *
 *  Rules are generated by extracting from:
 *      lang: local/Blocks.txt
 *      meta: local/UnicodeData-3.0.0.html
 *      data: local/UnicodeData.txt
 *      name: local/PropertyValueAliases.txt
 *  See Makefile where wget downloads these files from
 *      site: ftp://ftp.unicode.org/Public/
 *
 *  NOTE(review): the comment names this file "classify21.g4" while the grammar
 *  below is named "classify"; ANTLR expects the grammar name to match the file
 *  name, so confirm how this file is actually saved.
 */
grammar classify;
// Parser entry rule: matches exactly one token, namely the CLASSIFY_* lexer
// token for the code point's Unicode General_Category. There is deliberately
// no empty alternative, so the rule always consumes one token.
codepoint
    : CLASSIFY_Cc   // Control (alias: cntrl)
    | CLASSIFY_Cf   // Format
    | CLASSIFY_Co   // Private_Use
    | CLASSIFY_Cs   // Surrogate
    | CLASSIFY_Ll   // Lowercase_Letter
    | CLASSIFY_Lm   // Modifier_Letter
    | CLASSIFY_Lo   // Other_Letter
    | CLASSIFY_Lt   // Titlecase_Letter
    | CLASSIFY_Lu   // Uppercase_Letter
    | CLASSIFY_Mc   // Spacing_Mark
    | CLASSIFY_Me   // Enclosing_Mark
    | CLASSIFY_Mn   // Nonspacing_Mark
    | CLASSIFY_Nd   // Decimal_Number (alias: digit)
    | CLASSIFY_Nl   // Letter_Number
    | CLASSIFY_No   // Other_Number
    | CLASSIFY_Pc   // Connector_Punctuation
    | CLASSIFY_Pd   // Dash_Punctuation
    | CLASSIFY_Pe   // Close_Punctuation
    | CLASSIFY_Pf   // Final_Punctuation
    | CLASSIFY_Pi   // Initial_Punctuation
    | CLASSIFY_Po   // Other_Punctuation
    | CLASSIFY_Ps   // Open_Punctuation
    | CLASSIFY_Sc   // Currency_Symbol
    | CLASSIFY_Sk   // Modifier_Symbol
    | CLASSIFY_Sm   // Math_Symbol
    | CLASSIFY_So   // Other_Symbol
    | CLASSIFY_Zl   // Line_Separator
    | CLASSIFY_Zp   // Paragraph_Separator
    | CLASSIFY_Zs   // Space_Separator
    ;
// General_Category Cc (Control, alias "cntrl").
// Sample glyphs are intentionally not shown: these code points are
// non-printing and must not appear literally in the grammar source.
CLASSIFY_Cc
    : '\u{0000}'..'\u{001f}'   // Basic Latin: C0 controls
    | '\u{007f}'..'\u{009f}'   // Basic Latin DEL through Latin-1 Supplement C1 controls
    ;
// General_Category Cf (Format).
// Sample glyphs are intentionally not shown: format characters are invisible
// and several of them (e.g. U+202A..U+202E) are bidirectional controls that
// change how the surrounding source text is displayed.
CLASSIFY_Cf
    : '\u{00ad}'                 // Latin-1 Supplement
    | '\u{0600}'..'\u{0605}'     // Arabic
    | '\u{061c}'                 // Arabic
    | '\u{06dd}'                 // Arabic
    | '\u{070f}'                 // Syriac
    | '\u{08e2}'                 // Arabic Extended-A
    | '\u{180e}'                 // Mongolian
    | '\u{200b}'..'\u{200f}'     // General Punctuation
    | '\u{202a}'..'\u{202e}'     // General Punctuation (bidirectional embedding/override controls)
    // NOTE(review): this range appears to include U+2065, which is believed to
    // be unassigned in Unicode 9.0.0 - confirm against UnicodeData.txt.
    | '\u{2060}'..'\u{206f}'     // General Punctuation
    | '\u{feff}'                 // Arabic Presentation Forms-B
    | '\u{fff9}'..'\u{fffb}'     // Specials
    | '\u{110bd}'                // Kaithi
    | '\u{1bca0}'..'\u{1bca3}'   // Shorthand Format Controls
    | '\u{1d173}'..'\u{1d17a}'   // Musical Symbols
    // NOTE(review): this range appears to bridge U+E0002..U+E001F, which are
    // believed to be unassigned in Unicode 9.0.0 - confirm against UnicodeData.txt.
    | '\u{e0001}'..'\u{e007f}'   // Tags
    ;
// General_Category Co (Private_Use).
CLASSIFY_Co
    : '\u{e000}'..'\u{f8ff}'      // Private Use Area
    // NOTE(review): one range covers both supplementary private-use planes and
    // therefore also spans U+FFFFE..U+FFFFF, which are believed to be
    // noncharacters rather than private use - confirm against UnicodeData.txt.
    | '\u{f0000}'..'\u{10fffd}'   // Supplementary Private Use Area-A through Area-B
    ;
// General_Category Cs (Surrogate).
// Sample glyphs are intentionally not shown: lone surrogates cannot be
// represented in well-formed UTF-8 source text.
CLASSIFY_Cs
    : '\u{d800}'..'\u{dfff}'   // High Surrogates through Low Surrogates
    ;
// General_Category Ll (Lowercase_Letter).
// Alternatives are listed in ascending code point order and grouped under the
// Unicode block in which each alternative starts; a range may run on into the
// following block.
// NOTE(review): some ranges (e.g. U+1F70..U+1F87, U+2D00..U+2D2D,
// U+AB60..U+ABBF, U+FB00..U+FB17) appear to bridge code points that are
// unassigned in Unicode 9.0.0; presumably the generator merges ranges across
// such gaps - confirm against makeGrammars.py and UnicodeData.txt.
CLASSIFY_Ll
    // Basic Latin
    : '\u{0061}'..'\u{007a}'
    // Latin-1 Supplement
    | '\u{00b5}' | '\u{00df}'..'\u{00f6}' | '\u{00f8}'..'\u{00ff}'
    // Latin Extended-A (the last range runs on into Latin Extended-B)
    | '\u{0101}' | '\u{0103}' | '\u{0105}' | '\u{0107}' | '\u{0109}' | '\u{010b}' | '\u{010d}' | '\u{010f}'
    | '\u{0111}' | '\u{0113}' | '\u{0115}' | '\u{0117}' | '\u{0119}' | '\u{011b}' | '\u{011d}' | '\u{011f}'
    | '\u{0121}' | '\u{0123}' | '\u{0125}' | '\u{0127}' | '\u{0129}' | '\u{012b}' | '\u{012d}' | '\u{012f}'
    | '\u{0131}' | '\u{0133}' | '\u{0135}' | '\u{0137}'..'\u{0138}' | '\u{013a}' | '\u{013c}' | '\u{013e}' | '\u{0140}'
    | '\u{0142}' | '\u{0144}' | '\u{0146}' | '\u{0148}'..'\u{0149}' | '\u{014b}' | '\u{014d}' | '\u{014f}' | '\u{0151}'
    | '\u{0153}' | '\u{0155}' | '\u{0157}' | '\u{0159}' | '\u{015b}' | '\u{015d}' | '\u{015f}' | '\u{0161}'
    | '\u{0163}' | '\u{0165}' | '\u{0167}' | '\u{0169}' | '\u{016b}' | '\u{016d}' | '\u{016f}' | '\u{0171}'
    | '\u{0173}' | '\u{0175}' | '\u{0177}' | '\u{017a}' | '\u{017c}' | '\u{017e}'..'\u{0180}'
    // Latin Extended-B (the last range runs on into IPA Extensions)
    | '\u{0183}' | '\u{0185}' | '\u{0188}' | '\u{018c}'..'\u{018d}' | '\u{0192}' | '\u{0195}' | '\u{0199}'..'\u{019b}' | '\u{019e}'
    | '\u{01a1}' | '\u{01a3}' | '\u{01a5}' | '\u{01a8}' | '\u{01aa}'..'\u{01ab}' | '\u{01ad}' | '\u{01b0}' | '\u{01b4}'
    | '\u{01b6}' | '\u{01b9}'..'\u{01ba}' | '\u{01bd}'..'\u{01bf}' | '\u{01c6}' | '\u{01c9}' | '\u{01cc}' | '\u{01ce}' | '\u{01d0}'
    | '\u{01d2}' | '\u{01d4}' | '\u{01d6}' | '\u{01d8}' | '\u{01da}' | '\u{01dc}'..'\u{01dd}' | '\u{01df}' | '\u{01e1}'
    | '\u{01e3}' | '\u{01e5}' | '\u{01e7}' | '\u{01e9}' | '\u{01eb}' | '\u{01ed}' | '\u{01ef}'..'\u{01f0}' | '\u{01f3}'
    | '\u{01f5}' | '\u{01f9}' | '\u{01fb}' | '\u{01fd}' | '\u{01ff}' | '\u{0201}' | '\u{0203}' | '\u{0205}'
    | '\u{0207}' | '\u{0209}' | '\u{020b}' | '\u{020d}' | '\u{020f}' | '\u{0211}' | '\u{0213}' | '\u{0215}'
    | '\u{0217}' | '\u{0219}' | '\u{021b}' | '\u{021d}' | '\u{021f}' | '\u{0221}' | '\u{0223}' | '\u{0225}'
    | '\u{0227}' | '\u{0229}' | '\u{022b}' | '\u{022d}' | '\u{022f}' | '\u{0231}' | '\u{0233}'..'\u{0239}' | '\u{023c}'
    | '\u{023f}'..'\u{0240}' | '\u{0242}' | '\u{0247}' | '\u{0249}' | '\u{024b}' | '\u{024d}' | '\u{024f}'..'\u{0293}'
    // IPA Extensions
    | '\u{0295}'..'\u{02af}'
    // Greek and Coptic
    | '\u{0371}' | '\u{0373}' | '\u{0377}' | '\u{037b}'..'\u{037d}' | '\u{0390}' | '\u{03ac}'..'\u{03ce}' | '\u{03d0}'..'\u{03d1}' | '\u{03d5}'..'\u{03d7}'
    | '\u{03d9}' | '\u{03db}' | '\u{03dd}' | '\u{03df}' | '\u{03e1}' | '\u{03e3}' | '\u{03e5}' | '\u{03e7}'
    | '\u{03e9}' | '\u{03eb}' | '\u{03ed}' | '\u{03ef}'..'\u{03f3}' | '\u{03f5}' | '\u{03f8}' | '\u{03fb}'..'\u{03fc}'
    // Cyrillic
    | '\u{0430}'..'\u{045f}' | '\u{0461}' | '\u{0463}' | '\u{0465}' | '\u{0467}' | '\u{0469}' | '\u{046b}' | '\u{046d}'
    | '\u{046f}' | '\u{0471}' | '\u{0473}' | '\u{0475}' | '\u{0477}' | '\u{0479}' | '\u{047b}' | '\u{047d}'
    | '\u{047f}' | '\u{0481}' | '\u{048b}' | '\u{048d}' | '\u{048f}' | '\u{0491}' | '\u{0493}' | '\u{0495}'
    | '\u{0497}' | '\u{0499}' | '\u{049b}' | '\u{049d}' | '\u{049f}' | '\u{04a1}' | '\u{04a3}' | '\u{04a5}'
    | '\u{04a7}' | '\u{04a9}' | '\u{04ab}' | '\u{04ad}' | '\u{04af}' | '\u{04b1}' | '\u{04b3}' | '\u{04b5}'
    | '\u{04b7}' | '\u{04b9}' | '\u{04bb}' | '\u{04bd}' | '\u{04bf}' | '\u{04c2}' | '\u{04c4}' | '\u{04c6}'
    | '\u{04c8}' | '\u{04ca}' | '\u{04cc}' | '\u{04ce}'..'\u{04cf}' | '\u{04d1}' | '\u{04d3}' | '\u{04d5}' | '\u{04d7}'
    | '\u{04d9}' | '\u{04db}' | '\u{04dd}' | '\u{04df}' | '\u{04e1}' | '\u{04e3}' | '\u{04e5}' | '\u{04e7}'
    | '\u{04e9}' | '\u{04eb}' | '\u{04ed}' | '\u{04ef}' | '\u{04f1}' | '\u{04f3}' | '\u{04f5}' | '\u{04f7}'
    | '\u{04f9}' | '\u{04fb}' | '\u{04fd}' | '\u{04ff}'
    // Cyrillic Supplement
    | '\u{0501}' | '\u{0503}' | '\u{0505}' | '\u{0507}' | '\u{0509}' | '\u{050b}' | '\u{050d}' | '\u{050f}'
    | '\u{0511}' | '\u{0513}' | '\u{0515}' | '\u{0517}' | '\u{0519}' | '\u{051b}' | '\u{051d}' | '\u{051f}'
    | '\u{0521}' | '\u{0523}' | '\u{0525}' | '\u{0527}' | '\u{0529}' | '\u{052b}' | '\u{052d}' | '\u{052f}'
    // Armenian
    | '\u{0561}'..'\u{0587}'
    // Cherokee
    | '\u{13f8}'..'\u{13fd}'
    // Cyrillic Extended-C
    | '\u{1c80}'..'\u{1c88}'
    // Phonetic Extensions (the last range runs on into Phonetic Extensions Supplement)
    | '\u{1d00}'..'\u{1d2b}' | '\u{1d6b}'..'\u{1d77}' | '\u{1d79}'..'\u{1d9a}'
    // Latin Extended Additional (the last range runs on into Greek Extended)
    | '\u{1e01}' | '\u{1e03}' | '\u{1e05}' | '\u{1e07}' | '\u{1e09}' | '\u{1e0b}' | '\u{1e0d}' | '\u{1e0f}'
    | '\u{1e11}' | '\u{1e13}' | '\u{1e15}' | '\u{1e17}' | '\u{1e19}' | '\u{1e1b}' | '\u{1e1d}' | '\u{1e1f}'
    | '\u{1e21}' | '\u{1e23}' | '\u{1e25}' | '\u{1e27}' | '\u{1e29}' | '\u{1e2b}' | '\u{1e2d}' | '\u{1e2f}'
    | '\u{1e31}' | '\u{1e33}' | '\u{1e35}' | '\u{1e37}' | '\u{1e39}' | '\u{1e3b}' | '\u{1e3d}' | '\u{1e3f}'
    | '\u{1e41}' | '\u{1e43}' | '\u{1e45}' | '\u{1e47}' | '\u{1e49}' | '\u{1e4b}' | '\u{1e4d}' | '\u{1e4f}'
    | '\u{1e51}' | '\u{1e53}' | '\u{1e55}' | '\u{1e57}' | '\u{1e59}' | '\u{1e5b}' | '\u{1e5d}' | '\u{1e5f}'
    | '\u{1e61}' | '\u{1e63}' | '\u{1e65}' | '\u{1e67}' | '\u{1e69}' | '\u{1e6b}' | '\u{1e6d}' | '\u{1e6f}'
    | '\u{1e71}' | '\u{1e73}' | '\u{1e75}' | '\u{1e77}' | '\u{1e79}' | '\u{1e7b}' | '\u{1e7d}' | '\u{1e7f}'
    | '\u{1e81}' | '\u{1e83}' | '\u{1e85}' | '\u{1e87}' | '\u{1e89}' | '\u{1e8b}' | '\u{1e8d}' | '\u{1e8f}'
    | '\u{1e91}' | '\u{1e93}' | '\u{1e95}'..'\u{1e9d}' | '\u{1e9f}'
    | '\u{1ea1}' | '\u{1ea3}' | '\u{1ea5}' | '\u{1ea7}' | '\u{1ea9}' | '\u{1eab}' | '\u{1ead}' | '\u{1eaf}'
    | '\u{1eb1}' | '\u{1eb3}' | '\u{1eb5}' | '\u{1eb7}' | '\u{1eb9}' | '\u{1ebb}' | '\u{1ebd}' | '\u{1ebf}'
    | '\u{1ec1}' | '\u{1ec3}' | '\u{1ec5}' | '\u{1ec7}' | '\u{1ec9}' | '\u{1ecb}' | '\u{1ecd}' | '\u{1ecf}'
    | '\u{1ed1}' | '\u{1ed3}' | '\u{1ed5}' | '\u{1ed7}' | '\u{1ed9}' | '\u{1edb}' | '\u{1edd}' | '\u{1edf}'
    | '\u{1ee1}' | '\u{1ee3}' | '\u{1ee5}' | '\u{1ee7}' | '\u{1ee9}' | '\u{1eeb}' | '\u{1eed}' | '\u{1eef}'
    | '\u{1ef1}' | '\u{1ef3}' | '\u{1ef5}' | '\u{1ef7}' | '\u{1ef9}' | '\u{1efb}' | '\u{1efd}'
    | '\u{1eff}'..'\u{1f07}'
    // Greek Extended
    | '\u{1f10}'..'\u{1f15}' | '\u{1f20}'..'\u{1f27}' | '\u{1f30}'..'\u{1f37}' | '\u{1f40}'..'\u{1f45}'
    | '\u{1f50}'..'\u{1f57}' | '\u{1f60}'..'\u{1f67}' | '\u{1f70}'..'\u{1f87}' | '\u{1f90}'..'\u{1f97}'
    | '\u{1fa0}'..'\u{1fa7}' | '\u{1fb0}'..'\u{1fb7}' | '\u{1fbe}' | '\u{1fc2}'..'\u{1fc7}'
    | '\u{1fd0}'..'\u{1fd7}' | '\u{1fe0}'..'\u{1fe7}' | '\u{1ff2}'..'\u{1ff7}'
    // Letterlike Symbols
    | '\u{210a}' | '\u{210e}'..'\u{210f}' | '\u{2113}' | '\u{212f}' | '\u{2134}' | '\u{2139}'
    | '\u{213c}'..'\u{213d}' | '\u{2146}'..'\u{2149}' | '\u{214e}'
    // Number Forms
    | '\u{2184}'
    // Glagolitic
    | '\u{2c30}'..'\u{2c5e}'
    // Latin Extended-C
    | '\u{2c61}' | '\u{2c65}'..'\u{2c66}' | '\u{2c68}' | '\u{2c6a}' | '\u{2c6c}' | '\u{2c71}'
    | '\u{2c73}'..'\u{2c74}' | '\u{2c76}'..'\u{2c7b}'
    // Coptic
    | '\u{2c81}' | '\u{2c83}' | '\u{2c85}' | '\u{2c87}' | '\u{2c89}' | '\u{2c8b}' | '\u{2c8d}' | '\u{2c8f}'
    | '\u{2c91}' | '\u{2c93}' | '\u{2c95}' | '\u{2c97}' | '\u{2c99}' | '\u{2c9b}' | '\u{2c9d}' | '\u{2c9f}'
    | '\u{2ca1}' | '\u{2ca3}' | '\u{2ca5}' | '\u{2ca7}' | '\u{2ca9}' | '\u{2cab}' | '\u{2cad}' | '\u{2caf}'
    | '\u{2cb1}' | '\u{2cb3}' | '\u{2cb5}' | '\u{2cb7}' | '\u{2cb9}' | '\u{2cbb}' | '\u{2cbd}' | '\u{2cbf}'
    | '\u{2cc1}' | '\u{2cc3}' | '\u{2cc5}' | '\u{2cc7}' | '\u{2cc9}' | '\u{2ccb}' | '\u{2ccd}' | '\u{2ccf}'
    | '\u{2cd1}' | '\u{2cd3}' | '\u{2cd5}' | '\u{2cd7}' | '\u{2cd9}' | '\u{2cdb}' | '\u{2cdd}' | '\u{2cdf}'
    | '\u{2ce1}' | '\u{2ce3}'..'\u{2ce4}' | '\u{2cec}' | '\u{2cee}' | '\u{2cf3}'
    // Georgian Supplement
    | '\u{2d00}'..'\u{2d2d}'
    // Cyrillic Extended-B
    | '\u{a641}' | '\u{a643}' | '\u{a645}' | '\u{a647}' | '\u{a649}' | '\u{a64b}' | '\u{a64d}' | '\u{a64f}'
    | '\u{a651}' | '\u{a653}' | '\u{a655}' | '\u{a657}' | '\u{a659}' | '\u{a65b}' | '\u{a65d}' | '\u{a65f}'
    | '\u{a661}' | '\u{a663}' | '\u{a665}' | '\u{a667}' | '\u{a669}' | '\u{a66b}' | '\u{a66d}'
    | '\u{a681}' | '\u{a683}' | '\u{a685}' | '\u{a687}' | '\u{a689}' | '\u{a68b}' | '\u{a68d}' | '\u{a68f}'
    | '\u{a691}' | '\u{a693}' | '\u{a695}' | '\u{a697}' | '\u{a699}' | '\u{a69b}'
    // Latin Extended-D
    | '\u{a723}' | '\u{a725}' | '\u{a727}' | '\u{a729}' | '\u{a72b}' | '\u{a72d}' | '\u{a72f}'..'\u{a731}'
    | '\u{a733}' | '\u{a735}' | '\u{a737}' | '\u{a739}' | '\u{a73b}' | '\u{a73d}' | '\u{a73f}'
    | '\u{a741}' | '\u{a743}' | '\u{a745}' | '\u{a747}' | '\u{a749}' | '\u{a74b}' | '\u{a74d}' | '\u{a74f}'
    | '\u{a751}' | '\u{a753}' | '\u{a755}' | '\u{a757}' | '\u{a759}' | '\u{a75b}' | '\u{a75d}' | '\u{a75f}'
    | '\u{a761}' | '\u{a763}' | '\u{a765}' | '\u{a767}' | '\u{a769}' | '\u{a76b}' | '\u{a76d}' | '\u{a76f}'
    | '\u{a771}'..'\u{a778}' | '\u{a77a}' | '\u{a77c}' | '\u{a77f}' | '\u{a781}' | '\u{a783}' | '\u{a785}' | '\u{a787}'
    | '\u{a78c}' | '\u{a78e}' | '\u{a791}' | '\u{a793}'..'\u{a795}' | '\u{a797}' | '\u{a799}' | '\u{a79b}' | '\u{a79d}'
    | '\u{a79f}' | '\u{a7a1}' | '\u{a7a3}' | '\u{a7a5}' | '\u{a7a7}' | '\u{a7a9}' | '\u{a7b5}' | '\u{a7b7}' | '\u{a7fa}'
    // Latin Extended-E (the last range runs on into Cherokee Supplement)
    | '\u{ab30}'..'\u{ab5a}' | '\u{ab60}'..'\u{abbf}'
    // Alphabetic Presentation Forms
    | '\u{fb00}'..'\u{fb17}'
    // Halfwidth and Fullwidth Forms
    | '\u{ff41}'..'\u{ff5a}'
    // Deseret
    | '\u{10428}'..'\u{1044f}'
    // Osage
    | '\u{104d8}'..'\u{104fb}'
    // Old Hungarian
    | '\u{10cc0}'..'\u{10cf2}'
    // Warang Citi
    | '\u{118c0}'..'\u{118df}'
    // Mathematical Alphanumeric Symbols
    | '\u{1d41a}'..'\u{1d433}' | '\u{1d44e}'..'\u{1d467}' | '\u{1d482}'..'\u{1d49b}' | '\u{1d4b6}'..'\u{1d4cf}'
    | '\u{1d4ea}'..'\u{1d503}' | '\u{1d51e}'..'\u{1d537}' | '\u{1d552}'..'\u{1d56b}' | '\u{1d586}'..'\u{1d59f}'
    | '\u{1d5ba}'..'\u{1d5d3}' | '\u{1d5ee}'..'\u{1d607}' | '\u{1d622}'..'\u{1d63b}' | '\u{1d656}'..'\u{1d66f}'
    | '\u{1d68a}'..'\u{1d6a5}' | '\u{1d6c2}'..'\u{1d6da}' | '\u{1d6dc}'..'\u{1d6e1}' | '\u{1d6fc}'..'\u{1d714}'
    | '\u{1d716}'..'\u{1d71b}' | '\u{1d736}'..'\u{1d74e}' | '\u{1d750}'..'\u{1d755}' | '\u{1d770}'..'\u{1d788}'
    | '\u{1d78a}'..'\u{1d78f}' | '\u{1d7aa}'..'\u{1d7c2}' | '\u{1d7c4}'..'\u{1d7c9}' | '\u{1d7cb}'
    // Adlam
    | '\u{1e922}'..'\u{1e943}'
    ;
// General_Category Lm (Modifier_Letter).
// Each alternative is annotated with the Unicode block in which it starts.
// Sample glyphs are intentionally not shown: several of these code points are
// right-to-left or combining-like and distort how the line is displayed.
CLASSIFY_Lm
    : '\u{02b0}'..'\u{02c1}'     // Spacing Modifier Letters
    | '\u{02c6}'..'\u{02d1}'     // Spacing Modifier Letters
    | '\u{02e0}'..'\u{02e4}'     // Spacing Modifier Letters
    | '\u{02ec}'                 // Spacing Modifier Letters
    | '\u{02ee}'                 // Spacing Modifier Letters
    | '\u{0374}'                 // Greek and Coptic
    | '\u{037a}'                 // Greek and Coptic
    | '\u{0559}'                 // Armenian
    | '\u{0640}'                 // Arabic
    | '\u{06e5}'..'\u{06e6}'     // Arabic
    | '\u{07f4}'..'\u{07f5}'     // NKo
    | '\u{07fa}'                 // NKo
    | '\u{081a}'                 // Samaritan
    | '\u{0824}'                 // Samaritan
    | '\u{0828}'                 // Samaritan
    | '\u{0971}'                 // Devanagari
    | '\u{0e46}'                 // Thai
    | '\u{0ec6}'                 // Lao
    | '\u{10fc}'                 // Georgian
    | '\u{17d7}'                 // Khmer
    | '\u{1843}'                 // Mongolian
    | '\u{1aa7}'                 // Tai Tham
    | '\u{1c78}'..'\u{1c7d}'     // Ol Chiki
    | '\u{1d2c}'..'\u{1d6a}'     // Phonetic Extensions
    | '\u{1d78}'                 // Phonetic Extensions
    | '\u{1d9b}'..'\u{1dbf}'     // Phonetic Extensions Supplement
    | '\u{2071}'                 // Superscripts and Subscripts
    | '\u{207f}'                 // Superscripts and Subscripts
    | '\u{2090}'..'\u{209c}'     // Superscripts and Subscripts
    | '\u{2c7c}'..'\u{2c7d}'     // Latin Extended-C
    | '\u{2d6f}'                 // Tifinagh
    | '\u{2e2f}'                 // Supplemental Punctuation
    | '\u{3005}'                 // CJK Symbols and Punctuation
    | '\u{3031}'..'\u{3035}'     // CJK Symbols and Punctuation
    | '\u{303b}'                 // CJK Symbols and Punctuation
    | '\u{309d}'..'\u{309e}'     // Hiragana
    | '\u{30fc}'..'\u{30fe}'     // Katakana
    | '\u{a015}'                 // Yi Syllables
    | '\u{a4f8}'..'\u{a4fd}'     // Lisu
    | '\u{a60c}'                 // Vai
    | '\u{a67f}'                 // Cyrillic Extended-B
    | '\u{a69c}'..'\u{a69d}'     // Cyrillic Extended-B
    | '\u{a717}'..'\u{a71f}'     // Modifier Tone Letters
    | '\u{a770}'                 // Latin Extended-D
    | '\u{a788}'                 // Latin Extended-D
    | '\u{a7f8}'..'\u{a7f9}'     // Latin Extended-D
    | '\u{a9cf}'                 // Javanese
    | '\u{a9e6}'                 // Myanmar Extended-B
    | '\u{aa70}'                 // Myanmar Extended-A
    | '\u{aadd}'                 // Tai Viet
    | '\u{aaf3}'..'\u{aaf4}'     // Meetei Mayek Extensions
    | '\u{ab5c}'..'\u{ab5f}'     // Latin Extended-E
    | '\u{ff70}'                 // Halfwidth and Fullwidth Forms
    | '\u{ff9e}'..'\u{ff9f}'     // Halfwidth and Fullwidth Forms
    | '\u{16b40}'..'\u{16b43}'   // Pahawh Hmong
    // NOTE(review): this range starts in Miao and appears to run past the end
    // of that block (to U+16FE0), bridging code points believed to be
    // unassigned in Unicode 9.0.0 - confirm against Blocks.txt/UnicodeData.txt.
    | '\u{16f93}'..'\u{16fe0}'   // Miao
    ;
// CLASSIFY_Lo matches exactly one code point listed under the
// Other_Letter (Lo) general category.
// Each alternative is a single code point or an inclusive '..' range.
// The trailing comment shows the first (and last) glyph of the range and
// the Unicode block name of the FIRST code point only: several ranges run
// past that block (e.g. '\u{10fd}'..'\u{135a}' is labelled Georgian, and
// '\u{4e00}'..'\u{a014}' is labelled CJK Unified Ideographs although the
// next alternative, starting at U+A016, is labelled Yi Syllables).
// NOTE(review): such block-spanning ranges presumably also cover code
// points that are unassigned in Unicode 9.0 - confirm against
// UnicodeData.txt if unassigned code points must not match this token.
CLASSIFY_Lo: // Other_Letter
      '\u{00aa}' // [ª] Latin-1 Supplement
    | '\u{00ba}' // [º] Latin-1 Supplement
    | '\u{01bb}' // [ƻ] Latin Extended-B
    | '\u{01c0}'..'\u{01c3}' // [ǀ..ǃ] Latin Extended-B
    | '\u{0294}' // [ʔ] IPA Extensions
    | '\u{05d0}'..'\u{05f2}' // [א..ײ] Hebrew
    | '\u{0620}'..'\u{063f}' // [ؠ..ؿ] Arabic
    | '\u{0641}'..'\u{064a}' // [ف..ي] Arabic
    | '\u{066e}'..'\u{066f}' // [ٮ..ٯ] Arabic
    | '\u{0671}'..'\u{06d3}' // [ٱ..ۓ] Arabic
    | '\u{06d5}' // [ە] Arabic
    | '\u{06ee}'..'\u{06ef}' // [ۮ..ۯ] Arabic
    | '\u{06fa}'..'\u{06fc}' // [ۺ..ۼ] Arabic
    | '\u{06ff}' // [ۿ] Arabic
    | '\u{0710}' // [ܐ] Syriac
    | '\u{0712}'..'\u{072f}' // [ܒ..ܯ] Syriac
    | '\u{074d}'..'\u{07a5}' // [ݍ..ޥ] Syriac
    | '\u{07b1}' // [ޱ] Thaana
    | '\u{07ca}'..'\u{07ea}' // [ߊ..ߪ] NKo
    | '\u{0800}'..'\u{0815}' // [ࠀ..ࠕ] Samaritan
    | '\u{0840}'..'\u{0858}' // [ࡀ..ࡘ] Mandaic
    | '\u{08a0}'..'\u{08bd}' // [ࢠ..ࢽ] Arabic Extended-A
    | '\u{0904}'..'\u{0939}' // [ऄ..ह] Devanagari
    | '\u{093d}' // [ऽ] Devanagari
    | '\u{0950}' // [ॐ] Devanagari
    | '\u{0958}'..'\u{0961}' // [क़..ॡ] Devanagari
    | '\u{0972}'..'\u{0980}' // [ॲ..ঀ] Devanagari
    | '\u{0985}'..'\u{09b9}' // [অ..হ] Bengali
    | '\u{09bd}' // [ঽ] Bengali
    | '\u{09ce}' // [ৎ] Bengali
    | '\u{09dc}'..'\u{09e1}' // [ড়..ৡ] Bengali
    | '\u{09f0}'..'\u{09f1}' // [ৰ..ৱ] Bengali
    | '\u{0a05}'..'\u{0a39}' // [ਅ..ਹ] Gurmukhi
    | '\u{0a59}'..'\u{0a5e}' // [ਖ਼..ਫ਼] Gurmukhi
    | '\u{0a72}'..'\u{0a74}' // [ੲ..ੴ] Gurmukhi
    | '\u{0a85}'..'\u{0ab9}' // [અ..હ] Gujarati
    | '\u{0abd}' // [ઽ] Gujarati
    | '\u{0ad0}'..'\u{0ae1}' // [ૐ..ૡ] Gujarati
    | '\u{0af9}' // [ૹ] Gujarati
    | '\u{0b05}'..'\u{0b39}' // [ଅ..ହ] Oriya
    | '\u{0b3d}' // [ଽ] Oriya
    | '\u{0b5c}'..'\u{0b61}' // [ଡ଼..ୡ] Oriya
    | '\u{0b71}' // [ୱ] Oriya
    | '\u{0b83}'..'\u{0bb9}' // [ஃ..ஹ] Tamil
    | '\u{0bd0}' // [ௐ] Tamil
    | '\u{0c05}'..'\u{0c3d}' // [అ..ఽ] Telugu
    | '\u{0c58}'..'\u{0c61}' // [ౘ..ౡ] Telugu
    | '\u{0c80}' // [ಀ] Kannada
    | '\u{0c85}'..'\u{0cb9}' // [ಅ..ಹ] Kannada
    | '\u{0cbd}' // [ಽ] Kannada
    | '\u{0cde}'..'\u{0ce1}' // [ೞ..ೡ] Kannada
    | '\u{0cf1}'..'\u{0cf2}' // [ೱ..ೲ] Kannada
    | '\u{0d05}'..'\u{0d3d}' // [അ..ഽ] Malayalam
    | '\u{0d4e}' // [ൎ] Malayalam
    | '\u{0d54}'..'\u{0d56}' // [ൔ..ൖ] Malayalam
    | '\u{0d5f}'..'\u{0d61}' // [ൟ..ൡ] Malayalam
    | '\u{0d7a}'..'\u{0d7f}' // [ൺ..ൿ] Malayalam
    | '\u{0d85}'..'\u{0dc6}' // [අ..ෆ] Sinhala
    | '\u{0e01}'..'\u{0e30}' // [ก..ะ] Thai
    | '\u{0e32}'..'\u{0e33}' // [า..ำ] Thai
    | '\u{0e40}'..'\u{0e45}' // [เ..ๅ] Thai
    | '\u{0e81}'..'\u{0eb0}' // [ກ..ະ] Lao
    | '\u{0eb2}'..'\u{0eb3}' // [າ..ຳ] Lao
    | '\u{0ebd}'..'\u{0ec4}' // [ຽ..ໄ] Lao
    | '\u{0edc}'..'\u{0f00}' // [ໜ..ༀ] Lao
    | '\u{0f40}'..'\u{0f6c}' // [ཀ..ཬ] Tibetan
    | '\u{0f88}'..'\u{0f8c}' // [ྈ..ྌ] Tibetan
    | '\u{1000}'..'\u{102a}' // [က..ဪ] Myanmar
    | '\u{103f}' // [ဿ] Myanmar
    | '\u{1050}'..'\u{1055}' // [ၐ..ၕ] Myanmar
    | '\u{105a}'..'\u{105d}' // [ၚ..ၝ] Myanmar
    | '\u{1061}' // [ၡ] Myanmar
    | '\u{1065}'..'\u{1066}' // [ၥ..ၦ] Myanmar
    | '\u{106e}'..'\u{1070}' // [ၮ..ၰ] Myanmar
    | '\u{1075}'..'\u{1081}' // [ၵ..ႁ] Myanmar
    | '\u{108e}' // [ႎ] Myanmar
    | '\u{10d0}'..'\u{10fa}' // [ა..ჺ] Georgian
    | '\u{10fd}'..'\u{135a}' // [ჽ..ፚ] Georgian
    | '\u{1380}'..'\u{138f}' // [ᎀ..ᎏ] Ethiopic Supplement
    | '\u{1401}'..'\u{166c}' // [ᐁ..ᙬ] Unified Canadian Aboriginal Syllabics
    | '\u{166f}'..'\u{167f}' // [ᙯ..ᙿ] Unified Canadian Aboriginal Syllabics
    | '\u{1681}'..'\u{169a}' // [ᚁ..ᚚ] Ogham
    | '\u{16a0}'..'\u{16ea}' // [ᚠ..ᛪ] Runic
    | '\u{16f1}'..'\u{1711}' // [ᛱ..ᜑ] Runic
    | '\u{1720}'..'\u{1731}' // [ᜠ..ᜱ] Hanunoo
    | '\u{1740}'..'\u{1751}' // [ᝀ..ᝑ] Buhid
    | '\u{1760}'..'\u{1770}' // [ᝠ..ᝰ] Tagbanwa
    | '\u{1780}'..'\u{17b3}' // [ក..ឳ] Khmer
    | '\u{17dc}' // [ៜ] Khmer
    | '\u{1820}'..'\u{1842}' // [ᠠ..ᡂ] Mongolian
    | '\u{1844}'..'\u{1884}' // [ᡄ..ᢄ] Mongolian
    | '\u{1887}'..'\u{18a8}' // [ᢇ..ᢨ] Mongolian
    | '\u{18aa}'..'\u{191e}' // [ᢪ..ᤞ] Mongolian
    | '\u{1950}'..'\u{19c9}' // [ᥐ..ᧉ] Tai Le
    | '\u{1a00}'..'\u{1a16}' // [ᨀ..ᨖ] Buginese
    | '\u{1a20}'..'\u{1a54}' // [ᨠ..ᩔ] Tai Tham
    | '\u{1b05}'..'\u{1b33}' // [ᬅ..ᬳ] Balinese
    | '\u{1b45}'..'\u{1b4b}' // [ᭅ..ᭋ] Balinese
    | '\u{1b83}'..'\u{1ba0}' // [ᮃ..ᮠ] Sundanese
    | '\u{1bae}'..'\u{1baf}' // [ᮮ..ᮯ] Sundanese
    | '\u{1bba}'..'\u{1be5}' // [ᮺ..ᯥ] Sundanese
    | '\u{1c00}'..'\u{1c23}' // [ᰀ..ᰣ] Lepcha
    | '\u{1c4d}'..'\u{1c4f}' // [ᱍ..ᱏ] Lepcha
    | '\u{1c5a}'..'\u{1c77}' // [ᱚ..ᱷ] Ol Chiki
    | '\u{1ce9}'..'\u{1cec}' // [ᳩ..ᳬ] Vedic Extensions
    | '\u{1cee}'..'\u{1cf1}' // [ᳮ..ᳱ] Vedic Extensions
    | '\u{1cf5}'..'\u{1cf6}' // [ᳵ..ᳶ] Vedic Extensions
    | '\u{2135}'..'\u{2138}' // [ℵ..ℸ] Letterlike Symbols
    | '\u{2d30}'..'\u{2d67}' // [ⴰ..ⵧ] Tifinagh
    | '\u{2d80}'..'\u{2dde}' // [ⶀ..ⷞ] Ethiopic Extended
    | '\u{3006}' // [〆] CJK Symbols and Punctuation
    | '\u{303c}' // [〼] CJK Symbols and Punctuation
    | '\u{3041}'..'\u{3096}' // [ぁ..ゖ] Hiragana
    | '\u{309f}' // [ゟ] Hiragana
    | '\u{30a1}'..'\u{30fa}' // [ァ..ヺ] Katakana
    | '\u{30ff}'..'\u{318e}' // [ヿ..ㆎ] Katakana
    | '\u{31a0}'..'\u{31ba}' // [ㆠ..ㆺ] Bopomofo Extended
    | '\u{31f0}'..'\u{31ff}' // [ㇰ..ㇿ] Katakana Phonetic Extensions
    | '\u{3400}'..'\u{4db5}' // [㐀..䶵] CJK Unified Ideographs Extension A
    | '\u{4e00}'..'\u{a014}' // [一..ꀔ] CJK Unified Ideographs
    | '\u{a016}'..'\u{a48c}' // [ꀖ..ꒌ] Yi Syllables
    | '\u{a4d0}'..'\u{a4f7}' // [ꓐ..ꓷ] Lisu
    | '\u{a500}'..'\u{a60b}' // [ꔀ..ꘋ] Vai
    | '\u{a610}'..'\u{a61f}' // [ꘐ..ꘟ] Vai
    | '\u{a62a}'..'\u{a62b}' // [ꘪ..ꘫ] Vai
    | '\u{a66e}' // [ꙮ] Cyrillic Extended-B
    | '\u{a6a0}'..'\u{a6e5}' // [ꚠ..ꛥ] Bamum
    | '\u{a78f}' // [ꞏ] Latin Extended-D
    | '\u{a7f7}' // [ꟷ] Latin Extended-D
    | '\u{a7fb}'..'\u{a801}' // [ꟻ..ꠁ] Latin Extended-D
    | '\u{a803}'..'\u{a805}' // [ꠃ..ꠅ] Syloti Nagri
    | '\u{a807}'..'\u{a80a}' // [ꠇ..ꠊ] Syloti Nagri
    | '\u{a80c}'..'\u{a822}' // [ꠌ..ꠢ] Syloti Nagri
    | '\u{a840}'..'\u{a873}' // [ꡀ..ꡳ] Phags-pa
    | '\u{a882}'..'\u{a8b3}' // [ꢂ..ꢳ] Saurashtra
    | '\u{a8f2}'..'\u{a8f7}' // [ꣲ..ꣷ] Devanagari Extended
    | '\u{a8fb}' // [ꣻ] Devanagari Extended
    | '\u{a8fd}' // [ꣽ] Devanagari Extended
    | '\u{a90a}'..'\u{a925}' // [ꤊ..ꤥ] Kayah Li
    | '\u{a930}'..'\u{a946}' // [ꤰ..ꥆ] Rejang
    | '\u{a960}'..'\u{a97c}' // [ꥠ..ꥼ] Hangul Jamo Extended-A
    | '\u{a984}'..'\u{a9b2}' // [ꦄ..ꦲ] Javanese
    | '\u{a9e0}'..'\u{a9e4}' // [ꧠ..ꧤ] Myanmar Extended-B
    | '\u{a9e7}'..'\u{a9ef}' // [ꧧ..ꧯ] Myanmar Extended-B
    | '\u{a9fa}'..'\u{aa28}' // [ꧺ..ꨨ] Myanmar Extended-B
    | '\u{aa40}'..'\u{aa42}' // [ꩀ..ꩂ] Cham
    | '\u{aa44}'..'\u{aa4b}' // [ꩄ..ꩋ] Cham
    | '\u{aa60}'..'\u{aa6f}' // [ꩠ..ꩯ] Myanmar Extended-A
    | '\u{aa71}'..'\u{aa76}' // [ꩱ..ꩶ] Myanmar Extended-A
    | '\u{aa7a}' // [ꩺ] Myanmar Extended-A
    | '\u{aa7e}'..'\u{aaaf}' // [ꩾ..ꪯ] Myanmar Extended-A
    | '\u{aab1}' // [ꪱ] Tai Viet
    | '\u{aab5}'..'\u{aab6}' // [ꪵ..ꪶ] Tai Viet
    | '\u{aab9}'..'\u{aabd}' // [ꪹ..ꪽ] Tai Viet
    | '\u{aac0}' // [ꫀ] Tai Viet
    | '\u{aac2}'..'\u{aadc}' // [ꫂ..ꫜ] Tai Viet
    | '\u{aae0}'..'\u{aaea}' // [ꫠ..ꫪ] Meetei Mayek Extensions
    | '\u{aaf2}' // [ꫲ] Meetei Mayek Extensions
    | '\u{ab01}'..'\u{ab2e}' // [ꬁ..ꬮ] Ethiopic Extended-A
    | '\u{abc0}'..'\u{abe2}' // [ꯀ..ꯢ] Meetei Mayek
    | '\u{ac00}'..'\u{d7fb}' // [가..ퟻ] Hangul Syllables
    | '\u{f900}'..'\u{fad9}' // [豈..龎] CJK Compatibility Ideographs
    | '\u{fb1d}' // [יִ] Alphabetic Presentation Forms
    | '\u{fb1f}'..'\u{fb28}' // [ײַ..ﬨ] Alphabetic Presentation Forms
    | '\u{fb2a}'..'\u{fbb1}' // [שׁ..ﮱ] Alphabetic Presentation Forms
    | '\u{fbd3}'..'\u{fd3d}' // [ﯓ..ﴽ] Arabic Presentation Forms-A
    | '\u{fd50}'..'\u{fdfb}' // [ﵐ..ﷻ] Arabic Presentation Forms-A
    | '\u{fe70}'..'\u{fefc}' // [ﹰ..ﻼ] Arabic Presentation Forms-B
    | '\u{ff66}'..'\u{ff6f}' // [ヲ..ッ] Halfwidth and Fullwidth Forms
    | '\u{ff71}'..'\u{ff9d}' // [ア..ン] Halfwidth and Fullwidth Forms
    | '\u{ffa0}'..'\u{ffdc}' // [ᅠ..ᅵ] Halfwidth and Fullwidth Forms
    | '\u{10000}'..'\u{100fa}' // [𐀀..𐃺] Linear B Syllabary
    | '\u{10280}'..'\u{102d0}' // [𐊀..𐋐] Lycian
    | '\u{10300}'..'\u{1031f}' // [𐌀..𐌟] Old Italic
    | '\u{10330}'..'\u{10340}' // [𐌰..𐍀] Gothic
    | '\u{10342}'..'\u{10349}' // [𐍂..𐍉] Gothic
    | '\u{10350}'..'\u{10375}' // [𐍐..𐍵] Old Permic
    | '\u{10380}'..'\u{1039d}' // [𐎀..𐎝] Ugaritic
    | '\u{103a0}'..'\u{103cf}' // [𐎠..𐏏] Old Persian
    | '\u{10450}'..'\u{1049d}' // [𐑐..𐒝] Shavian
    | '\u{10500}'..'\u{10563}' // [𐔀..𐕣] Elbasan
    | '\u{10600}'..'\u{10855}' // [𐘀..𐡕] Linear A
    | '\u{10860}'..'\u{10876}' // [𐡠..𐡶] Palmyrene
    | '\u{10880}'..'\u{1089e}' // [𐢀..𐢞] Nabataean
    | '\u{108e0}'..'\u{108f5}' // [𐣠..𐣵] Hatran
    | '\u{10900}'..'\u{10915}' // [𐤀..𐤕] Phoenician
    | '\u{10920}'..'\u{10939}' // [𐤠..𐤹] Lydian
    | '\u{10980}'..'\u{109b7}' // [𐦀..𐦷] Meroitic Hieroglyphs
    | '\u{109be}'..'\u{109bf}' // [𐦾..𐦿] Meroitic Cursive
    | '\u{10a00}' // [𐨀] Kharoshthi
    | '\u{10a10}'..'\u{10a33}' // [𐨐..𐨳] Kharoshthi
    | '\u{10a60}'..'\u{10a7c}' // [𐩠..𐩼] Old South Arabian
    | '\u{10a80}'..'\u{10a9c}' // [𐪀..𐪜] Old North Arabian
    | '\u{10ac0}'..'\u{10ac7}' // [𐫀..𐫇] Manichaean
    | '\u{10ac9}'..'\u{10ae4}' // [𐫉..𐫤] Manichaean
    | '\u{10b00}'..'\u{10b35}' // [𐬀..𐬵] Avestan
    | '\u{10b40}'..'\u{10b55}' // [𐭀..𐭕] Inscriptional Parthian
    | '\u{10b60}'..'\u{10b72}' // [𐭠..𐭲] Inscriptional Pahlavi
    | '\u{10b80}'..'\u{10b91}' // [𐮀..𐮑] Psalter Pahlavi
    | '\u{10c00}'..'\u{10c48}' // [𐰀..𐱈] Old Turkic
    | '\u{11003}'..'\u{11037}' // [𑀃..𑀷] Brahmi
    | '\u{11083}'..'\u{110af}' // [𑂃..𑂯] Kaithi
    | '\u{110d0}'..'\u{110e8}' // [𑃐..𑃨] Sora Sompeng
    | '\u{11103}'..'\u{11126}' // [𑄃..𑄦] Chakma
    | '\u{11150}'..'\u{11172}' // [𑅐..𑅲] Mahajani
    | '\u{11176}' // [𑅶] Mahajani
    | '\u{11183}'..'\u{111b2}' // [𑆃..𑆲] Sharada
    | '\u{111c1}'..'\u{111c4}' // [𑇁..𑇄] Sharada
    | '\u{111da}' // [𑇚] Sharada
    | '\u{111dc}' // [𑇜] Sharada
    | '\u{11200}'..'\u{1122b}' // [𑈀..𑈫] Khojki
    | '\u{11280}'..'\u{112a8}' // [𑊀..𑊨] Multani
    | '\u{112b0}'..'\u{112de}' // [𑊰..𑋞] Khudawadi
    | '\u{11305}'..'\u{11339}' // [𑌅..𑌹] Grantha
    | '\u{1133d}' // [𑌽] Grantha
    | '\u{11350}' // [𑍐] Grantha
    | '\u{1135d}'..'\u{11361}' // [𑍝..𑍡] Grantha
    | '\u{11400}'..'\u{11434}' // [𑐀..𑐴] Newa
    | '\u{11447}'..'\u{1144a}' // [𑑇..𑑊] Newa
    | '\u{11480}'..'\u{114af}' // [𑒀..𑒯] Tirhuta
    | '\u{114c4}'..'\u{114c5}' // [𑓄..𑓅] Tirhuta
    | '\u{114c7}' // [𑓇] Tirhuta
    | '\u{11580}'..'\u{115ae}' // [𑖀..𑖮] Siddham
    | '\u{115d8}'..'\u{115db}' // [𑗘..𑗛] Siddham
    | '\u{11600}'..'\u{1162f}' // [𑘀..𑘯] Modi
    | '\u{11644}' // [𑙄] Modi
    | '\u{11680}'..'\u{116aa}' // [𑚀..𑚪] Takri
    | '\u{11700}'..'\u{11719}' // [𑜀..𑜙] Ahom
    | '\u{118ff}'..'\u{11c2e}' // [𑣿..𑰮] Warang Citi
    | '\u{11c40}' // [𑱀] Bhaiksuki
    | '\u{11c72}'..'\u{11c8f}' // [𑱲..𑲏] Marchen
    | '\u{12000}'..'\u{12399}' // [𒀀..𒎙] Cuneiform
    | '\u{12480}'..'\u{16a5e}' // [𒒀..𖩞] Early Dynastic Cuneiform
    | '\u{16ad0}'..'\u{16aed}' // [𖫐..𖫭] Bassa Vah
    | '\u{16b00}'..'\u{16b2f}' // [𖬀..𖬯] Pahawh Hmong
    | '\u{16b63}'..'\u{16f50}' // [𖭣..𖽐] Pahawh Hmong
    | '\u{17000}'..'\u{1bc99}' // [𗀀..𛲙] Tangut
    | '\u{1e800}'..'\u{1e8c4}' // [𞠀..𞣄] Mende Kikakui
    | '\u{1ee00}'..'\u{1eebb}' // [𞸀..𞺻] Arabic Mathematical Alphabetic Symbols
    | '\u{20000}'..'\u{2fa1d}' // [𠀀..𪘀] CJK Unified Ideographs Extension B
    ;
// CLASSIFY_Lt matches exactly one code point listed under the
// Titlecase_Letter (Lt) general category.
// Each alternative is a single code point or an inclusive '..' range.
// The trailing comment shows the first (and last) glyph of the range and
// the Unicode block name associated with the start of the range.
CLASSIFY_Lt: // Titlecase_Letter
      '\u{01c5}' // [ǅ] Latin Extended-B
    | '\u{01c8}' // [ǈ] Latin Extended-B
    | '\u{01cb}' // [ǋ] Latin Extended-B
    | '\u{01f2}' // [ǲ] Latin Extended-B
    | '\u{1f88}'..'\u{1f8f}' // [ᾈ..ᾏ] Greek Extended
    | '\u{1f98}'..'\u{1f9f}' // [ᾘ..ᾟ] Greek Extended
    | '\u{1fa8}'..'\u{1faf}' // [ᾨ..ᾯ] Greek Extended
    | '\u{1fbc}' // [ᾼ] Greek Extended
    | '\u{1fcc}' // [ῌ] Greek Extended
    | '\u{1ffc}' // [ῼ] Greek Extended
    ;
CLASSIFY_Lu: // Uppercase_Letter | |
'\u{0041}'..'\u{005a}' // [A..Z] Basic Latin | |
| '\u{00c0}'..'\u{00d6}' // [À..Ö] Latin-1 Supplement | |
| '\u{00d8}'..'\u{00de}' // [Ø..Þ] Latin-1 Supplement | |
| '\u{0100}' // [Ā] Latin Extended-A | |
| '\u{0102}' // [Ă] Latin Extended-A | |
| '\u{0104}' // [Ą] Latin Extended-A | |
| '\u{0106}' // [Ć] Latin Extended-A | |
| '\u{0108}' // [Ĉ] Latin Extended-A | |
| '\u{010a}' // [Ċ] Latin Extended-A | |
| '\u{010c}' // [Č] Latin Extended-A | |
| '\u{010e}' // [Ď] Latin Extended-A | |
| '\u{0110}' // [Đ] Latin Extended-A | |
| '\u{0112}' // [Ē] Latin Extended-A | |
| '\u{0114}' // [Ĕ] Latin Extended-A | |
| '\u{0116}' // [Ė] Latin Extended-A | |
| '\u{0118}' // [Ę] Latin Extended-A | |
| '\u{011a}' // [Ě] Latin Extended-A | |
| '\u{011c}' // [Ĝ] Latin Extended-A | |
| '\u{011e}' // [Ğ] Latin Extended-A | |
| '\u{0120}' // [Ġ] Latin Extended-A | |
| '\u{0122}' // [Ģ] Latin Extended-A | |
| '\u{0124}' // [Ĥ] Latin Extended-A | |
| '\u{0126}' // [Ħ] Latin Extended-A | |
| '\u{0128}' // [Ĩ] Latin Extended-A | |
| '\u{012a}' // [Ī] Latin Extended-A | |
| '\u{012c}' // [Ĭ] Latin Extended-A | |
| '\u{012e}' // [Į] Latin Extended-A | |
| '\u{0130}' // [İ] Latin Extended-A | |
| '\u{0132}' // [IJ] Latin Extended-A | |
| '\u{0134}' // [Ĵ] Latin Extended-A | |
| '\u{0136}' // [Ķ] Latin Extended-A | |
| '\u{0139}' // [Ĺ] Latin Extended-A | |
| '\u{013b}' // [Ļ] Latin Extended-A | |
| '\u{013d}' // [Ľ] Latin Extended-A | |
| '\u{013f}' // [Ŀ] Latin Extended-A | |
| '\u{0141}' // [Ł] Latin Extended-A | |
| '\u{0143}' // [Ń] Latin Extended-A | |
| '\u{0145}' // [Ņ] Latin Extended-A | |
| '\u{0147}' // [Ň] Latin Extended-A | |
| '\u{014a}' // [Ŋ] Latin Extended-A | |
| '\u{014c}' // [Ō] Latin Extended-A | |
| '\u{014e}' // [Ŏ] Latin Extended-A | |
| '\u{0150}' // [Ő] Latin Extended-A | |
| '\u{0152}' // [Œ] Latin Extended-A | |
| '\u{0154}' // [Ŕ] Latin Extended-A | |
| '\u{0156}' // [Ŗ] Latin Extended-A | |
| '\u{0158}' // [Ř] Latin Extended-A | |
| '\u{015a}' // [Ś] Latin Extended-A | |
| '\u{015c}' // [Ŝ] Latin Extended-A | |
| '\u{015e}' // [Ş] Latin Extended-A | |
| '\u{0160}' // [Š] Latin Extended-A | |
| '\u{0162}' // [Ţ] Latin Extended-A | |
| '\u{0164}' // [Ť] Latin Extended-A | |
| '\u{0166}' // [Ŧ] Latin Extended-A | |
| '\u{0168}' // [Ũ] Latin Extended-A | |
| '\u{016a}' // [Ū] Latin Extended-A | |
| '\u{016c}' // [Ŭ] Latin Extended-A | |
| '\u{016e}' // [Ů] Latin Extended-A | |
| '\u{0170}' // [Ű] Latin Extended-A | |
| '\u{0172}' // [Ų] Latin Extended-A | |
| '\u{0174}' // [Ŵ] Latin Extended-A | |
| '\u{0176}' // [Ŷ] Latin Extended-A | |
| '\u{0178}'..'\u{0179}' // [Ÿ..Ź] Latin Extended-A | |
| '\u{017b}' // [Ż] Latin Extended-A | |
| '\u{017d}' // [Ž] Latin Extended-A | |
| '\u{0181}'..'\u{0182}' // [Ɓ..Ƃ] Latin Extended-B | |
| '\u{0184}' // [Ƅ] Latin Extended-B | |
| '\u{0186}'..'\u{0187}' // [Ɔ..Ƈ] Latin Extended-B | |
| '\u{0189}'..'\u{018b}' // [Ɖ..Ƌ] Latin Extended-B | |
| '\u{018e}'..'\u{0191}' // [Ǝ..Ƒ] Latin Extended-B | |
| '\u{0193}'..'\u{0194}' // [Ɠ..Ɣ] Latin Extended-B | |
| '\u{0196}'..'\u{0198}' // [Ɩ..Ƙ] Latin Extended-B | |
| '\u{019c}'..'\u{019d}' // [Ɯ..Ɲ] Latin Extended-B | |
| '\u{019f}'..'\u{01a0}' // [Ɵ..Ơ] Latin Extended-B | |
| '\u{01a2}' // [Ƣ] Latin Extended-B | |
| '\u{01a4}' // [Ƥ] Latin Extended-B | |
| '\u{01a6}'..'\u{01a7}' // [Ʀ..Ƨ] Latin Extended-B | |
| '\u{01a9}' // [Ʃ] Latin Extended-B | |
| '\u{01ac}' // [Ƭ] Latin Extended-B | |
| '\u{01ae}'..'\u{01af}' // [Ʈ..Ư] Latin Extended-B | |
| '\u{01b1}'..'\u{01b3}' // [Ʊ..Ƴ] Latin Extended-B | |
| '\u{01b5}' // [Ƶ] Latin Extended-B | |
| '\u{01b7}'..'\u{01b8}' // [Ʒ..Ƹ] Latin Extended-B | |
| '\u{01bc}' // [Ƽ] Latin Extended-B | |
| '\u{01c4}' // [DŽ] Latin Extended-B | |
| '\u{01c7}' // [LJ] Latin Extended-B | |
| '\u{01ca}' // [NJ] Latin Extended-B | |
| '\u{01cd}' // [Ǎ] Latin Extended-B | |
| '\u{01cf}' // [Ǐ] Latin Extended-B | |
| '\u{01d1}' // [Ǒ] Latin Extended-B | |
| '\u{01d3}' // [Ǔ] Latin Extended-B | |
| '\u{01d5}' // [Ǖ] Latin Extended-B | |
| '\u{01d7}' // [Ǘ] Latin Extended-B | |
| '\u{01d9}' // [Ǚ] Latin Extended-B | |
| '\u{01db}' // [Ǜ] Latin Extended-B | |
| '\u{01de}' // [Ǟ] Latin Extended-B | |
| '\u{01e0}' // [Ǡ] Latin Extended-B | |
| '\u{01e2}' // [Ǣ] Latin Extended-B | |
| '\u{01e4}' // [Ǥ] Latin Extended-B | |
| '\u{01e6}' // [Ǧ] Latin Extended-B | |
| '\u{01e8}' // [Ǩ] Latin Extended-B | |
| '\u{01ea}' // [Ǫ] Latin Extended-B | |
| '\u{01ec}' // [Ǭ] Latin Extended-B | |
| '\u{01ee}' // [Ǯ] Latin Extended-B | |
| '\u{01f1}' // [DZ] Latin Extended-B | |
| '\u{01f4}' // [Ǵ] Latin Extended-B | |
| '\u{01f6}'..'\u{01f8}' // [Ƕ..Ǹ] Latin Extended-B | |
| '\u{01fa}' // [Ǻ] Latin Extended-B | |
| '\u{01fc}' // [Ǽ] Latin Extended-B | |
| '\u{01fe}' // [Ǿ] Latin Extended-B | |
| '\u{0200}' // [Ȁ] Latin Extended-B | |
| '\u{0202}' // [Ȃ] Latin Extended-B | |
| '\u{0204}' // [Ȅ] Latin Extended-B | |
| '\u{0206}' // [Ȇ] Latin Extended-B | |
| '\u{0208}' // [Ȉ] Latin Extended-B | |
| '\u{020a}' // [Ȋ] Latin Extended-B | |
| '\u{020c}' // [Ȍ] Latin Extended-B | |
| '\u{020e}' // [Ȏ] Latin Extended-B | |
| '\u{0210}' // [Ȑ] Latin Extended-B | |
| '\u{0212}' // [Ȓ] Latin Extended-B | |
| '\u{0214}' // [Ȕ] Latin Extended-B | |
| '\u{0216}' // [Ȗ] Latin Extended-B | |
| '\u{0218}' // [Ș] Latin Extended-B | |
| '\u{021a}' // [Ț] Latin Extended-B | |
| '\u{021c}' // [Ȝ] Latin Extended-B | |
| '\u{021e}' // [Ȟ] Latin Extended-B | |
| '\u{0220}' // [Ƞ] Latin Extended-B | |
| '\u{0222}' // [Ȣ] Latin Extended-B | |
| '\u{0224}' // [Ȥ] Latin Extended-B | |
| '\u{0226}' // [Ȧ] Latin Extended-B | |
| '\u{0228}' // [Ȩ] Latin Extended-B | |
| '\u{022a}' // [Ȫ] Latin Extended-B | |
| '\u{022c}' // [Ȭ] Latin Extended-B | |
| '\u{022e}' // [Ȯ] Latin Extended-B | |
| '\u{0230}' // [Ȱ] Latin Extended-B | |
| '\u{0232}' // [Ȳ] Latin Extended-B | |
| '\u{023a}'..'\u{023b}' // [Ⱥ..Ȼ] Latin Extended-B | |
| '\u{023d}'..'\u{023e}' // [Ƚ..Ⱦ] Latin Extended-B | |
| '\u{0241}' // [Ɂ] Latin Extended-B | |
| '\u{0243}'..'\u{0246}' // [Ƀ..Ɇ] Latin Extended-B | |
| '\u{0248}' // [Ɉ] Latin Extended-B | |
| '\u{024a}' // [Ɋ] Latin Extended-B | |
| '\u{024c}' // [Ɍ] Latin Extended-B | |
| '\u{024e}' // [Ɏ] Latin Extended-B | |
| '\u{0370}' // [Ͱ] Greek and Coptic | |
| '\u{0372}' // [Ͳ] Greek and Coptic | |
| '\u{0376}' // [Ͷ] Greek and Coptic | |
| '\u{037f}' // [Ϳ] Greek and Coptic | |
| '\u{0386}' // [Ά] Greek and Coptic | |
| '\u{0388}'..'\u{038f}' // [Έ..Ώ] Greek and Coptic | |
| '\u{0391}'..'\u{03ab}' // [Α..Ϋ] Greek and Coptic | |
| '\u{03cf}' // [Ϗ] Greek and Coptic | |
| '\u{03d2}'..'\u{03d4}' // [ϒ..ϔ] Greek and Coptic | |
| '\u{03d8}' // [Ϙ] Greek and Coptic | |
| '\u{03da}' // [Ϛ] Greek and Coptic | |
| '\u{03dc}' // [Ϝ] Greek and Coptic | |
| '\u{03de}' // [Ϟ] Greek and Coptic | |
| '\u{03e0}' // [Ϡ] Greek and Coptic | |
| '\u{03e2}' // [Ϣ] Greek and Coptic | |
| '\u{03e4}' // [Ϥ] Greek and Coptic | |
| '\u{03e6}' // [Ϧ] Greek and Coptic | |
| '\u{03e8}' // [Ϩ] Greek and Coptic | |
| '\u{03ea}' // [Ϫ] Greek and Coptic | |
| '\u{03ec}' // [Ϭ] Greek and Coptic | |
| '\u{03ee}' // [Ϯ] Greek and Coptic | |
| '\u{03f4}' // [ϴ] Greek and Coptic | |
| '\u{03f7}' // [Ϸ] Greek and Coptic | |
| '\u{03f9}'..'\u{03fa}' // [Ϲ..Ϻ] Greek and Coptic | |
| '\u{03fd}'..'\u{042f}' // [Ͻ..Я] Greek and Coptic | |
| '\u{0460}' // [Ѡ] Cyrillic | |
| '\u{0462}' // [Ѣ] Cyrillic | |
| '\u{0464}' // [Ѥ] Cyrillic | |
| '\u{0466}' // [Ѧ] Cyrillic | |
| '\u{0468}' // [Ѩ] Cyrillic | |
| '\u{046a}' // [Ѫ] Cyrillic | |
| '\u{046c}' // [Ѭ] Cyrillic | |
| '\u{046e}' // [Ѯ] Cyrillic | |
| '\u{0470}' // [Ѱ] Cyrillic | |
| '\u{0472}' // [Ѳ] Cyrillic | |
| '\u{0474}' // [Ѵ] Cyrillic | |
| '\u{0476}' // [Ѷ] Cyrillic | |
| '\u{0478}' // [Ѹ] Cyrillic | |
| '\u{047a}' // [Ѻ] Cyrillic | |
| '\u{047c}' // [Ѽ] Cyrillic | |
| '\u{047e}' // [Ѿ] Cyrillic | |
| '\u{0480}' // [Ҁ] Cyrillic | |
| '\u{048a}' // [Ҋ] Cyrillic | |
| '\u{048c}' // [Ҍ] Cyrillic | |
| '\u{048e}' // [Ҏ] Cyrillic | |
| '\u{0490}' // [Ґ] Cyrillic | |
| '\u{0492}' // [Ғ] Cyrillic | |
| '\u{0494}' // [Ҕ] Cyrillic | |
| '\u{0496}' // [Җ] Cyrillic | |
| '\u{0498}' // [Ҙ] Cyrillic | |
| '\u{049a}' // [Қ] Cyrillic | |
| '\u{049c}' // [Ҝ] Cyrillic | |
| '\u{049e}' // [Ҟ] Cyrillic | |
| '\u{04a0}' // [Ҡ] Cyrillic | |
| '\u{04a2}' // [Ң] Cyrillic | |
| '\u{04a4}' // [Ҥ] Cyrillic | |
| '\u{04a6}' // [Ҧ] Cyrillic | |
| '\u{04a8}' // [Ҩ] Cyrillic | |
| '\u{04aa}' // [Ҫ] Cyrillic | |
| '\u{04ac}' // [Ҭ] Cyrillic | |
| '\u{04ae}' // [Ү] Cyrillic | |
| '\u{04b0}' // [Ұ] Cyrillic | |
| '\u{04b2}' // [Ҳ] Cyrillic | |
| '\u{04b4}' // [Ҵ] Cyrillic | |
| '\u{04b6}' // [Ҷ] Cyrillic | |
| '\u{04b8}' // [Ҹ] Cyrillic | |
| '\u{04ba}' // [Һ] Cyrillic | |
| '\u{04bc}' // [Ҽ] Cyrillic | |
| '\u{04be}' // [Ҿ] Cyrillic | |
| '\u{04c0}'..'\u{04c1}' // [Ӏ..Ӂ] Cyrillic | |
| '\u{04c3}' // [Ӄ] Cyrillic | |
| '\u{04c5}' // [Ӆ] Cyrillic | |
| '\u{04c7}' // [Ӈ] Cyrillic | |
| '\u{04c9}' // [Ӊ] Cyrillic | |
| '\u{04cb}' // [Ӌ] Cyrillic | |
| '\u{04cd}' // [Ӎ] Cyrillic | |
| '\u{04d0}' // [Ӑ] Cyrillic | |
| '\u{04d2}' // [Ӓ] Cyrillic | |
| '\u{04d4}' // [Ӕ] Cyrillic | |
| '\u{04d6}' // [Ӗ] Cyrillic | |
| '\u{04d8}' // [Ә] Cyrillic | |
| '\u{04da}' // [Ӛ] Cyrillic | |
| '\u{04dc}' // [Ӝ] Cyrillic | |
| '\u{04de}' // [Ӟ] Cyrillic | |
| '\u{04e0}' // [Ӡ] Cyrillic | |
| '\u{04e2}' // [Ӣ] Cyrillic | |
| '\u{04e4}' // [Ӥ] Cyrillic | |
| '\u{04e6}' // [Ӧ] Cyrillic | |
| '\u{04e8}' // [Ө] Cyrillic | |
| '\u{04ea}' // [Ӫ] Cyrillic | |
| '\u{04ec}' // [Ӭ] Cyrillic | |
| '\u{04ee}' // [Ӯ] Cyrillic | |
| '\u{04f0}' // [Ӱ] Cyrillic | |
| '\u{04f2}' // [Ӳ] Cyrillic | |
| '\u{04f4}' // [Ӵ] Cyrillic | |
| '\u{04f6}' // [Ӷ] Cyrillic | |
| '\u{04f8}' // [Ӹ] Cyrillic | |
| '\u{04fa}' // [Ӻ] Cyrillic | |
| '\u{04fc}' // [Ӽ] Cyrillic | |
| '\u{04fe}' // [Ӿ] Cyrillic | |
| '\u{0500}' // [Ԁ] Cyrillic Supplement | |
| '\u{0502}' // [Ԃ] Cyrillic Supplement | |
| '\u{0504}' // [Ԅ] Cyrillic Supplement | |
| '\u{0506}' // [Ԇ] Cyrillic Supplement | |
| '\u{0508}' // [Ԉ] Cyrillic Supplement | |
| '\u{050a}' // [Ԋ] Cyrillic Supplement | |
| '\u{050c}' // [Ԍ] Cyrillic Supplement | |
| '\u{050e}' // [Ԏ] Cyrillic Supplement | |
| '\u{0510}' // [Ԑ] Cyrillic Supplement | |
| '\u{0512}' // [Ԓ] Cyrillic Supplement | |
| '\u{0514}' // [Ԕ] Cyrillic Supplement | |
| '\u{0516}' // [Ԗ] Cyrillic Supplement | |
| '\u{0518}' // [Ԙ] Cyrillic Supplement | |
| '\u{051a}' // [Ԛ] Cyrillic Supplement | |
| '\u{051c}' // [Ԝ] Cyrillic Supplement | |
| '\u{051e}' // [Ԟ] Cyrillic Supplement | |
| '\u{0520}' // [Ԡ] Cyrillic Supplement | |
| '\u{0522}' // [Ԣ] Cyrillic Supplement | |
| '\u{0524}' // [Ԥ] Cyrillic Supplement | |
| '\u{0526}' // [Ԧ] Cyrillic Supplement | |
| '\u{0528}' // [Ԩ] Cyrillic Supplement | |
| '\u{052a}' // [Ԫ] Cyrillic Supplement | |
| '\u{052c}' // [Ԭ] Cyrillic Supplement | |
| '\u{052e}' // [Ԯ] Cyrillic Supplement | |
| '\u{0531}'..'\u{0556}' // [Ա..Ֆ] Armenian | |
| '\u{10a0}'..'\u{10cd}' // [Ⴀ..Ⴭ] Georgian | |
| '\u{13a0}'..'\u{13f5}' // [Ꭰ..Ᏽ] Cherokee | |
| '\u{1e00}' // [Ḁ] Latin Extended Additional | |
| '\u{1e02}' // [Ḃ] Latin Extended Additional | |
| '\u{1e04}' // [Ḅ] Latin Extended Additional | |
| '\u{1e06}' // [Ḇ] Latin Extended Additional | |
| '\u{1e08}' // [Ḉ] Latin Extended Additional | |
| '\u{1e0a}' // [Ḋ] Latin Extended Additional | |
| '\u{1e0c}' // [Ḍ] Latin Extended Additional | |
| '\u{1e0e}' // [Ḏ] Latin Extended Additional | |
| '\u{1e10}' // [Ḑ] Latin Extended Additional | |
| '\u{1e12}' // [Ḓ] Latin Extended Additional | |
| '\u{1e14}' // [Ḕ] Latin Extended Additional | |
| '\u{1e16}' // [Ḗ] Latin Extended Additional | |
| '\u{1e18}' // [Ḙ] Latin Extended Additional | |
| '\u{1e1a}' // [Ḛ] Latin Extended Additional | |
| '\u{1e1c}' // [Ḝ] Latin Extended Additional | |
| '\u{1e1e}' // [Ḟ] Latin Extended Additional | |
| '\u{1e20}' // [Ḡ] Latin Extended Additional | |
| '\u{1e22}' // [Ḣ] Latin Extended Additional | |
| '\u{1e24}' // [Ḥ] Latin Extended Additional | |
| '\u{1e26}' // [Ḧ] Latin Extended Additional | |
| '\u{1e28}' // [Ḩ] Latin Extended Additional | |
| '\u{1e2a}' // [Ḫ] Latin Extended Additional | |
| '\u{1e2c}' // [Ḭ] Latin Extended Additional | |
| '\u{1e2e}' // [Ḯ] Latin Extended Additional | |
| '\u{1e30}' // [Ḱ] Latin Extended Additional | |
| '\u{1e32}' // [Ḳ] Latin Extended Additional | |
| '\u{1e34}' // [Ḵ] Latin Extended Additional | |
| '\u{1e36}' // [Ḷ] Latin Extended Additional | |
| '\u{1e38}' // [Ḹ] Latin Extended Additional | |
| '\u{1e3a}' // [Ḻ] Latin Extended Additional | |
| '\u{1e3c}' // [Ḽ] Latin Extended Additional | |
| '\u{1e3e}' // [Ḿ] Latin Extended Additional | |
| '\u{1e40}' // [Ṁ] Latin Extended Additional | |
| '\u{1e42}' // [Ṃ] Latin Extended Additional | |
| '\u{1e44}' // [Ṅ] Latin Extended Additional | |
| '\u{1e46}' // [Ṇ] Latin Extended Additional | |
| '\u{1e48}' // [Ṉ] Latin Extended Additional | |
| '\u{1e4a}' // [Ṋ] Latin Extended Additional | |
| '\u{1e4c}' // [Ṍ] Latin Extended Additional | |
| '\u{1e4e}' // [Ṏ] Latin Extended Additional | |
| '\u{1e50}' // [Ṑ] Latin Extended Additional | |
| '\u{1e52}' // [Ṓ] Latin Extended Additional | |
| '\u{1e54}' // [Ṕ] Latin Extended Additional | |
| '\u{1e56}' // [Ṗ] Latin Extended Additional | |
| '\u{1e58}' // [Ṙ] Latin Extended Additional | |
| '\u{1e5a}' // [Ṛ] Latin Extended Additional | |
| '\u{1e5c}' // [Ṝ] Latin Extended Additional | |
| '\u{1e5e}' // [Ṟ] Latin Extended Additional | |
| '\u{1e60}' // [Ṡ] Latin Extended Additional | |
| '\u{1e62}' // [Ṣ] Latin Extended Additional | |
| '\u{1e64}' // [Ṥ] Latin Extended Additional | |
| '\u{1e66}' // [Ṧ] Latin Extended Additional | |
| '\u{1e68}' // [Ṩ] Latin Extended Additional | |
| '\u{1e6a}' // [Ṫ] Latin Extended Additional | |
| '\u{1e6c}' // [Ṭ] Latin Extended Additional | |
| '\u{1e6e}' // [Ṯ] Latin Extended Additional | |
| '\u{1e70}' // [Ṱ] Latin Extended Additional | |
| '\u{1e72}' // [Ṳ] Latin Extended Additional | |
| '\u{1e74}' // [Ṵ] Latin Extended Additional | |
| '\u{1e76}' // [Ṷ] Latin Extended Additional | |
| '\u{1e78}' // [Ṹ] Latin Extended Additional | |
| '\u{1e7a}' // [Ṻ] Latin Extended Additional | |
| '\u{1e7c}' // [Ṽ] Latin Extended Additional | |
| '\u{1e7e}' // [Ṿ] Latin Extended Additional | |
| '\u{1e80}' // [Ẁ] Latin Extended Additional | |
| '\u{1e82}' // [Ẃ] Latin Extended Additional | |
| '\u{1e84}' // [Ẅ] Latin Extended Additional | |
| '\u{1e86}' // [Ẇ] Latin Extended Additional | |
| '\u{1e88}' // [Ẉ] Latin Extended Additional | |
| '\u{1e8a}' // [Ẋ] Latin Extended Additional | |
| '\u{1e8c}' // [Ẍ] Latin Extended Additional | |
| '\u{1e8e}' // [Ẏ] Latin Extended Additional | |
| '\u{1e90}' // [Ẑ] Latin Extended Additional | |
| '\u{1e92}' // [Ẓ] Latin Extended Additional | |
| '\u{1e94}' // [Ẕ] Latin Extended Additional | |
| '\u{1e9e}' // [ẞ] Latin Extended Additional | |
| '\u{1ea0}' // [Ạ] Latin Extended Additional | |
| '\u{1ea2}' // [Ả] Latin Extended Additional | |
| '\u{1ea4}' // [Ấ] Latin Extended Additional | |
| '\u{1ea6}' // [Ầ] Latin Extended Additional | |
| '\u{1ea8}' // [Ẩ] Latin Extended Additional | |
| '\u{1eaa}' // [Ẫ] Latin Extended Additional | |
| '\u{1eac}' // [Ậ] Latin Extended Additional | |
| '\u{1eae}' // [Ắ] Latin Extended Additional | |
| '\u{1eb0}' // [Ằ] Latin Extended Additional | |
| '\u{1eb2}' // [Ẳ] Latin Extended Additional | |
| '\u{1eb4}' // [Ẵ] Latin Extended Additional | |
| '\u{1eb6}' // [Ặ] Latin Extended Additional | |
| '\u{1eb8}' // [Ẹ] Latin Extended Additional | |
| '\u{1eba}' // [Ẻ] Latin Extended Additional | |
| '\u{1ebc}' // [Ẽ] Latin Extended Additional | |
| '\u{1ebe}' // [Ế] Latin Extended Additional | |
| '\u{1ec0}' // [Ề] Latin Extended Additional | |
| '\u{1ec2}' // [Ể] Latin Extended Additional | |
| '\u{1ec4}' // [Ễ] Latin Extended Additional | |
| '\u{1ec6}' // [Ệ] Latin Extended Additional | |
| '\u{1ec8}' // [Ỉ] Latin Extended Additional | |
| '\u{1eca}' // [Ị] Latin Extended Additional | |
| '\u{1ecc}' // [Ọ] Latin Extended Additional | |
| '\u{1ece}' // [Ỏ] Latin Extended Additional | |
| '\u{1ed0}' // [Ố] Latin Extended Additional | |
| '\u{1ed2}' // [Ồ] Latin Extended Additional | |
| '\u{1ed4}' // [Ổ] Latin Extended Additional | |
| '\u{1ed6}' // [Ỗ] Latin Extended Additional | |
| '\u{1ed8}' // [Ộ] Latin Extended Additional | |
| '\u{1eda}' // [Ớ] Latin Extended Additional | |
| '\u{1edc}' // [Ờ] Latin Extended Additional | |
| '\u{1ede}' // [Ở] Latin Extended Additional | |
| '\u{1ee0}' // [Ỡ] Latin Extended Additional | |
| '\u{1ee2}' // [Ợ] Latin Extended Additional | |
| '\u{1ee4}' // [Ụ] Latin Extended Additional | |
| '\u{1ee6}' // [Ủ] Latin Extended Additional | |
| '\u{1ee8}' // [Ứ] Latin Extended Additional | |
| '\u{1eea}' // [Ừ] Latin Extended Additional | |
| '\u{1eec}' // [Ử] Latin Extended Additional | |
| '\u{1eee}' // [Ữ] Latin Extended Additional | |
| '\u{1ef0}' // [Ự] Latin Extended Additional | |
| '\u{1ef2}' // [Ỳ] Latin Extended Additional | |
| '\u{1ef4}' // [Ỵ] Latin Extended Additional | |
| '\u{1ef6}' // [Ỷ] Latin Extended Additional | |
| '\u{1ef8}' // [Ỹ] Latin Extended Additional | |
| '\u{1efa}' // [Ỻ] Latin Extended Additional | |
| '\u{1efc}' // [Ỽ] Latin Extended Additional | |
| '\u{1efe}' // [Ỿ] Latin Extended Additional | |
| '\u{1f08}'..'\u{1f0f}' // [Ἀ..Ἇ] Greek Extended | |
| '\u{1f18}'..'\u{1f1d}' // [Ἐ..Ἕ] Greek Extended | |
| '\u{1f28}'..'\u{1f2f}' // [Ἠ..Ἧ] Greek Extended | |
| '\u{1f38}'..'\u{1f3f}' // [Ἰ..Ἷ] Greek Extended | |
| '\u{1f48}'..'\u{1f4d}' // [Ὀ..Ὅ] Greek Extended | |
| '\u{1f59}'..'\u{1f5f}' // [Ὑ..Ὗ] Greek Extended | |
| '\u{1f68}'..'\u{1f6f}' // [Ὠ..Ὧ] Greek Extended | |
| '\u{1fb8}'..'\u{1fbb}' // [Ᾰ..Ά] Greek Extended | |
| '\u{1fc8}'..'\u{1fcb}' // [Ὲ..Ή] Greek Extended | |
| '\u{1fd8}'..'\u{1fdb}' // [Ῐ..Ί] Greek Extended | |
| '\u{1fe8}'..'\u{1fec}' // [Ῠ..Ῥ] Greek Extended | |
| '\u{1ff8}'..'\u{1ffb}' // [Ὸ..Ώ] Greek Extended | |
| '\u{2102}' // [ℂ] Letterlike Symbols | |
| '\u{2107}' // [ℇ] Letterlike Symbols | |
| '\u{210b}'..'\u{210d}' // [ℋ..ℍ] Letterlike Symbols | |
| '\u{2110}'..'\u{2112}' // [ℐ..ℒ] Letterlike Symbols | |
| '\u{2115}' // [ℕ] Letterlike Symbols | |
| '\u{2119}'..'\u{211d}' // [ℙ..ℝ] Letterlike Symbols | |
| '\u{2124}' // [ℤ] Letterlike Symbols | |
| '\u{2126}' // [Ω] Letterlike Symbols | |
| '\u{2128}' // [ℨ] Letterlike Symbols | |
| '\u{212a}'..'\u{212d}' // [K..ℭ] Letterlike Symbols | |
| '\u{2130}'..'\u{2133}' // [ℰ..ℳ] Letterlike Symbols | |
| '\u{213e}'..'\u{213f}' // [ℾ..ℿ] Letterlike Symbols | |
| '\u{2145}' // [ⅅ] Letterlike Symbols | |
| '\u{2183}' // [Ↄ] Number Forms | |
| '\u{2c00}'..'\u{2c2e}' // [Ⰰ..Ⱞ] Glagolitic | |
| '\u{2c60}' // [Ⱡ] Latin Extended-C | |
| '\u{2c62}'..'\u{2c64}' // [Ɫ..Ɽ] Latin Extended-C | |
| '\u{2c67}' // [Ⱨ] Latin Extended-C | |
| '\u{2c69}' // [Ⱪ] Latin Extended-C | |
| '\u{2c6b}' // [Ⱬ] Latin Extended-C | |
| '\u{2c6d}'..'\u{2c70}' // [Ɑ..Ɒ] Latin Extended-C | |
| '\u{2c72}' // [Ⱳ] Latin Extended-C | |
| '\u{2c75}' // [Ⱶ] Latin Extended-C | |
| '\u{2c7e}'..'\u{2c80}' // [Ȿ..Ⲁ] Latin Extended-C | |
| '\u{2c82}' // [Ⲃ] Coptic | |
| '\u{2c84}' // [Ⲅ] Coptic | |
| '\u{2c86}' // [Ⲇ] Coptic | |
| '\u{2c88}' // [Ⲉ] Coptic | |
| '\u{2c8a}' // [Ⲋ] Coptic | |
| '\u{2c8c}' // [Ⲍ] Coptic | |
| '\u{2c8e}' // [Ⲏ] Coptic | |
| '\u{2c90}' // [Ⲑ] Coptic | |
| '\u{2c92}' // [Ⲓ] Coptic | |
| '\u{2c94}' // [Ⲕ] Coptic | |
| '\u{2c96}' // [Ⲗ] Coptic | |
| '\u{2c98}' // [Ⲙ] Coptic | |
| '\u{2c9a}' // [Ⲛ] Coptic | |
| '\u{2c9c}' // [Ⲝ] Coptic | |
| '\u{2c9e}' // [Ⲟ] Coptic | |
| '\u{2ca0}' // [Ⲡ] Coptic | |
| '\u{2ca2}' // [Ⲣ] Coptic | |
| '\u{2ca4}' // [Ⲥ] Coptic | |
| '\u{2ca6}' // [Ⲧ] Coptic | |
| '\u{2ca8}' // [Ⲩ] Coptic | |
| '\u{2caa}' // [Ⲫ] Coptic | |
| '\u{2cac}' // [Ⲭ] Coptic | |
| '\u{2cae}' // [Ⲯ] Coptic | |
| '\u{2cb0}' // [Ⲱ] Coptic | |
| '\u{2cb2}' // [Ⲳ] Coptic | |
| '\u{2cb4}' // [Ⲵ] Coptic | |
| '\u{2cb6}' // [Ⲷ] Coptic | |
| '\u{2cb8}' // [Ⲹ] Coptic | |
| '\u{2cba}' // [Ⲻ] Coptic | |
| '\u{2cbc}' // [Ⲽ] Coptic | |
| '\u{2cbe}' // [Ⲿ] Coptic | |
| '\u{2cc0}' // [Ⳁ] Coptic | |
| '\u{2cc2}' // [Ⳃ] Coptic | |
| '\u{2cc4}' // [Ⳅ] Coptic | |
| '\u{2cc6}' // [Ⳇ] Coptic | |
| '\u{2cc8}' // [Ⳉ] Coptic | |
| '\u{2cca}' // [Ⳋ] Coptic | |
| '\u{2ccc}' // [Ⳍ] Coptic | |
| '\u{2cce}' // [Ⳏ] Coptic | |
| '\u{2cd0}' // [Ⳑ] Coptic | |
| '\u{2cd2}' // [Ⳓ] Coptic | |
| '\u{2cd4}' // [Ⳕ] Coptic | |
| '\u{2cd6}' // [Ⳗ] Coptic | |
| '\u{2cd8}' // [Ⳙ] Coptic | |
| '\u{2cda}' // [Ⳛ] Coptic | |
| '\u{2cdc}' // [Ⳝ] Coptic | |
| '\u{2cde}' // [Ⳟ] Coptic | |
| '\u{2ce0}' // [Ⳡ] Coptic | |
| '\u{2ce2}' // [Ⳣ] Coptic | |
| '\u{2ceb}' // [Ⳬ] Coptic | |
| '\u{2ced}' // [Ⳮ] Coptic | |
| '\u{2cf2}' // [Ⳳ] Coptic | |
| '\u{a640}' // [Ꙁ] Cyrillic Extended-B | |
| '\u{a642}' // [Ꙃ] Cyrillic Extended-B | |
| '\u{a644}' // [Ꙅ] Cyrillic Extended-B | |
| '\u{a646}' // [Ꙇ] Cyrillic Extended-B | |
| '\u{a648}' // [Ꙉ] Cyrillic Extended-B | |
| '\u{a64a}' // [Ꙋ] Cyrillic Extended-B | |
| '\u{a64c}' // [Ꙍ] Cyrillic Extended-B | |
| '\u{a64e}' // [Ꙏ] Cyrillic Extended-B | |
| '\u{a650}' // [Ꙑ] Cyrillic Extended-B | |
| '\u{a652}' // [Ꙓ] Cyrillic Extended-B | |
| '\u{a654}' // [Ꙕ] Cyrillic Extended-B | |
| '\u{a656}' // [Ꙗ] Cyrillic Extended-B | |
| '\u{a658}' // [Ꙙ] Cyrillic Extended-B | |
| '\u{a65a}' // [Ꙛ] Cyrillic Extended-B | |
| '\u{a65c}' // [Ꙝ] Cyrillic Extended-B | |
| '\u{a65e}' // [Ꙟ] Cyrillic Extended-B | |
| '\u{a660}' // [Ꙡ] Cyrillic Extended-B | |
| '\u{a662}' // [Ꙣ] Cyrillic Extended-B | |
| '\u{a664}' // [Ꙥ] Cyrillic Extended-B | |
| '\u{a666}' // [Ꙧ] Cyrillic Extended-B | |
| '\u{a668}' // [Ꙩ] Cyrillic Extended-B | |
| '\u{a66a}' // [Ꙫ] Cyrillic Extended-B | |
| '\u{a66c}' // [Ꙭ] Cyrillic Extended-B | |
| '\u{a680}' // [Ꚁ] Cyrillic Extended-B | |
| '\u{a682}' // [Ꚃ] Cyrillic Extended-B | |
| '\u{a684}' // [Ꚅ] Cyrillic Extended-B | |
| '\u{a686}' // [Ꚇ] Cyrillic Extended-B | |
| '\u{a688}' // [Ꚉ] Cyrillic Extended-B | |
| '\u{a68a}' // [Ꚋ] Cyrillic Extended-B | |
| '\u{a68c}' // [Ꚍ] Cyrillic Extended-B | |
| '\u{a68e}' // [Ꚏ] Cyrillic Extended-B | |
| '\u{a690}' // [Ꚑ] Cyrillic Extended-B | |
| '\u{a692}' // [Ꚓ] Cyrillic Extended-B | |
| '\u{a694}' // [Ꚕ] Cyrillic Extended-B | |
| '\u{a696}' // [Ꚗ] Cyrillic Extended-B | |
| '\u{a698}' // [Ꚙ] Cyrillic Extended-B | |
| '\u{a69a}' // [Ꚛ] Cyrillic Extended-B | |
| '\u{a722}' // [Ꜣ] Latin Extended-D | |
| '\u{a724}' // [Ꜥ] Latin Extended-D | |
| '\u{a726}' // [Ꜧ] Latin Extended-D | |
| '\u{a728}' // [Ꜩ] Latin Extended-D | |
| '\u{a72a}' // [Ꜫ] Latin Extended-D | |
| '\u{a72c}' // [Ꜭ] Latin Extended-D | |
| '\u{a72e}' // [Ꜯ] Latin Extended-D | |
| '\u{a732}' // [Ꜳ] Latin Extended-D | |
| '\u{a734}' // [Ꜵ] Latin Extended-D | |
| '\u{a736}' // [Ꜷ] Latin Extended-D | |
| '\u{a738}' // [Ꜹ] Latin Extended-D | |
| '\u{a73a}' // [Ꜻ] Latin Extended-D | |
| '\u{a73c}' // [Ꜽ] Latin Extended-D | |
| '\u{a73e}' // [Ꜿ] Latin Extended-D | |
| '\u{a740}' // [Ꝁ] Latin Extended-D | |
| '\u{a742}' // [Ꝃ] Latin Extended-D | |
| '\u{a744}' // [Ꝅ] Latin Extended-D | |
| '\u{a746}' // [Ꝇ] Latin Extended-D | |
| '\u{a748}' // [Ꝉ] Latin Extended-D | |
| '\u{a74a}' // [Ꝋ] Latin Extended-D | |
| '\u{a74c}' // [Ꝍ] Latin Extended-D | |
| '\u{a74e}' // [Ꝏ] Latin Extended-D | |
| '\u{a750}' // [Ꝑ] Latin Extended-D | |
| '\u{a752}' // [Ꝓ] Latin Extended-D | |
| '\u{a754}' // [Ꝕ] Latin Extended-D | |
| '\u{a756}' // [Ꝗ] Latin Extended-D | |
| '\u{a758}' // [Ꝙ] Latin Extended-D | |
| '\u{a75a}' // [Ꝛ] Latin Extended-D | |
| '\u{a75c}' // [Ꝝ] Latin Extended-D | |
| '\u{a75e}' // [Ꝟ] Latin Extended-D | |
| '\u{a760}' // [Ꝡ] Latin Extended-D | |
| '\u{a762}' // [Ꝣ] Latin Extended-D | |
| '\u{a764}' // [Ꝥ] Latin Extended-D | |
| '\u{a766}' // [Ꝧ] Latin Extended-D | |
| '\u{a768}' // [Ꝩ] Latin Extended-D | |
| '\u{a76a}' // [Ꝫ] Latin Extended-D | |
| '\u{a76c}' // [Ꝭ] Latin Extended-D | |
| '\u{a76e}' // [Ꝯ] Latin Extended-D | |
| '\u{a779}' // [Ꝺ] Latin Extended-D | |
| '\u{a77b}' // [Ꝼ] Latin Extended-D | |
| '\u{a77d}'..'\u{a77e}' // [Ᵹ..Ꝿ] Latin Extended-D | |
| '\u{a780}' // [Ꞁ] Latin Extended-D | |
| '\u{a782}' // [Ꞃ] Latin Extended-D | |
| '\u{a784}' // [Ꞅ] Latin Extended-D | |
| '\u{a786}' // [Ꞇ] Latin Extended-D | |
| '\u{a78b}' // [Ꞌ] Latin Extended-D | |
| '\u{a78d}' // [Ɥ] Latin Extended-D | |
| '\u{a790}' // [Ꞑ] Latin Extended-D | |
| '\u{a792}' // [Ꞓ] Latin Extended-D | |
| '\u{a796}' // [Ꞗ] Latin Extended-D | |
| '\u{a798}' // [Ꞙ] Latin Extended-D | |
| '\u{a79a}' // [Ꞛ] Latin Extended-D | |
| '\u{a79c}' // [Ꞝ] Latin Extended-D | |
| '\u{a79e}' // [Ꞟ] Latin Extended-D | |
| '\u{a7a0}' // [Ꞡ] Latin Extended-D | |
| '\u{a7a2}' // [Ꞣ] Latin Extended-D | |
| '\u{a7a4}' // [Ꞥ] Latin Extended-D | |
| '\u{a7a6}' // [Ꞧ] Latin Extended-D | |
| '\u{a7a8}' // [Ꞩ] Latin Extended-D | |
| '\u{a7aa}'..'\u{a7b4}' // [Ɦ..Ꞵ] Latin Extended-D | |
| '\u{a7b6}' // [Ꞷ] Latin Extended-D | |
| '\u{ff21}'..'\u{ff3a}' // [A..Z] Halfwidth and Fullwidth Forms | |
| '\u{10400}'..'\u{10427}' // [𐐀..𐐧] Deseret | |
| '\u{104b0}'..'\u{104d3}' // [𐒰..𐓓] Osage | |
| '\u{10c80}'..'\u{10cb2}' // [𐲀..𐲲] Old Hungarian | |
| '\u{118a0}'..'\u{118bf}' // [𑢠..𑢿] Warang Citi | |
| '\u{1d400}'..'\u{1d419}' // [𝐀..𝐙] Mathematical Alphanumeric Symbols | |
| '\u{1d434}'..'\u{1d44d}' // [𝐴..𝑍] Mathematical Alphanumeric Symbols | |
| '\u{1d468}'..'\u{1d481}' // [𝑨..𝒁] Mathematical Alphanumeric Symbols | |
| '\u{1d49c}'..'\u{1d4b5}' // [𝒜..𝒵] Mathematical Alphanumeric Symbols | |
| '\u{1d4d0}'..'\u{1d4e9}' // [𝓐..𝓩] Mathematical Alphanumeric Symbols | |
| '\u{1d504}'..'\u{1d51c}' // [𝔄..𝔜] Mathematical Alphanumeric Symbols | |
| '\u{1d538}'..'\u{1d550}' // [𝔸..𝕐] Mathematical Alphanumeric Symbols | |
| '\u{1d56c}'..'\u{1d585}' // [𝕬..𝖅] Mathematical Alphanumeric Symbols | |
| '\u{1d5a0}'..'\u{1d5b9}' // [𝖠..𝖹] Mathematical Alphanumeric Symbols | |
| '\u{1d5d4}'..'\u{1d5ed}' // [𝗔..𝗭] Mathematical Alphanumeric Symbols | |
| '\u{1d608}'..'\u{1d621}' // [𝘈..𝘡] Mathematical Alphanumeric Symbols | |
| '\u{1d63c}'..'\u{1d655}' // [𝘼..𝙕] Mathematical Alphanumeric Symbols | |
| '\u{1d670}'..'\u{1d689}' // [𝙰..𝚉] Mathematical Alphanumeric Symbols | |
| '\u{1d6a8}'..'\u{1d6c0}' // [𝚨..𝛀] Mathematical Alphanumeric Symbols | |
| '\u{1d6e2}'..'\u{1d6fa}' // [𝛢..𝛺] Mathematical Alphanumeric Symbols | |
| '\u{1d71c}'..'\u{1d734}' // [𝜜..𝜴] Mathematical Alphanumeric Symbols | |
| '\u{1d756}'..'\u{1d76e}' // [𝝖..𝝮] Mathematical Alphanumeric Symbols | |
| '\u{1d790}'..'\u{1d7a8}' // [𝞐..𝞨] Mathematical Alphanumeric Symbols | |
| '\u{1d7ca}' // [𝟊] Mathematical Alphanumeric Symbols | |
| '\u{1e900}'..'\u{1e921}' // [𞤀..𞤡] Adlam | |
; | |
// CLASSIFY_Mc matches exactly one code point whose General_Category is
// Mc (Spacing_Mark) in the Unicode 9.0.0 data this grammar is generated from.
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the first/last glyph and the Unicode block name.
// Ranges are split wherever Unicode 9.0.0 leaves a code point unassigned, so
// the rule never classifies an unassigned code point as a spacing mark.
CLASSIFY_Mc: // Spacing_Mark
  '\u{0903}' // [ः] Devanagari
| '\u{093b}' // [ऻ] Devanagari
| '\u{093e}'..'\u{0940}' // [ा..ी] Devanagari
| '\u{0949}'..'\u{094c}' // [ॉ..ौ] Devanagari
| '\u{094e}'..'\u{094f}' // [ॎ..ॏ] Devanagari
| '\u{0982}'..'\u{0983}' // [ং..ঃ] Bengali
| '\u{09be}'..'\u{09c0}' // [া..ী] Bengali
| '\u{09c7}'..'\u{09c8}' // [ে..ৈ] Bengali
| '\u{09cb}'..'\u{09cc}' // [ো..ৌ] Bengali
| '\u{09d7}' // [ৗ] Bengali
| '\u{0a03}' // [ਃ] Gurmukhi
| '\u{0a3e}'..'\u{0a40}' // [ਾ..ੀ] Gurmukhi
| '\u{0a83}' // [ઃ] Gujarati
| '\u{0abe}'..'\u{0ac0}' // [ા..ી] Gujarati
| '\u{0ac9}' // [ૉ] Gujarati
| '\u{0acb}'..'\u{0acc}' // [ો..ૌ] Gujarati
| '\u{0b02}'..'\u{0b03}' // [ଂ..ଃ] Oriya
| '\u{0b3e}' // [ା] Oriya
| '\u{0b40}' // [ୀ] Oriya
| '\u{0b47}'..'\u{0b48}' // [େ..ୈ] Oriya
| '\u{0b4b}'..'\u{0b4c}' // [ୋ..ୌ] Oriya
| '\u{0b57}' // [ୗ] Oriya
| '\u{0bbe}'..'\u{0bbf}' // [ா..ி] Tamil
| '\u{0bc1}'..'\u{0bc2}' // [ு..ூ] Tamil
| '\u{0bc6}'..'\u{0bc8}' // [ெ..ை] Tamil
| '\u{0bca}'..'\u{0bcc}' // [ொ..ௌ] Tamil
| '\u{0bd7}' // [ௗ] Tamil
| '\u{0c01}'..'\u{0c03}' // [ఁ..ః] Telugu
| '\u{0c41}'..'\u{0c44}' // [ు..ౄ] Telugu
| '\u{0c82}'..'\u{0c83}' // [ಂ..ಃ] Kannada
| '\u{0cbe}' // [ಾ] Kannada
| '\u{0cc0}'..'\u{0cc4}' // [ೀ..ೄ] Kannada
| '\u{0cc7}'..'\u{0cc8}' // [ೇ..ೈ] Kannada
| '\u{0cca}'..'\u{0ccb}' // [ೊ..ೋ] Kannada
| '\u{0cd5}'..'\u{0cd6}' // [ೕ..ೖ] Kannada
| '\u{0d02}'..'\u{0d03}' // [ം..ഃ] Malayalam
| '\u{0d3e}'..'\u{0d40}' // [ാ..ീ] Malayalam
| '\u{0d46}'..'\u{0d48}' // [െ..ൈ] Malayalam
| '\u{0d4a}'..'\u{0d4c}' // [ൊ..ൌ] Malayalam
| '\u{0d57}' // [ൗ] Malayalam
| '\u{0d82}'..'\u{0d83}' // [ං..ඃ] Sinhala
| '\u{0dcf}'..'\u{0dd1}' // [ා..ෑ] Sinhala
| '\u{0dd8}'..'\u{0ddf}' // [ෘ..ෟ] Sinhala
| '\u{0df2}'..'\u{0df3}' // [ෲ..ෳ] Sinhala
| '\u{0f3e}'..'\u{0f3f}' // [༾..༿] Tibetan
| '\u{0f7f}' // [ཿ] Tibetan
| '\u{102b}'..'\u{102c}' // [ါ..ာ] Myanmar
| '\u{1031}' // [ေ] Myanmar
| '\u{1038}' // [း] Myanmar
| '\u{103b}'..'\u{103c}' // [ျ..ြ] Myanmar
| '\u{1056}'..'\u{1057}' // [ၖ..ၗ] Myanmar
| '\u{1062}'..'\u{1064}' // [ၢ..ၤ] Myanmar
| '\u{1067}'..'\u{106d}' // [ၧ..ၭ] Myanmar
| '\u{1083}'..'\u{1084}' // [ႃ..ႄ] Myanmar
| '\u{1087}'..'\u{108c}' // [ႇ..ႌ] Myanmar
| '\u{108f}' // [ႏ] Myanmar
| '\u{109a}'..'\u{109c}' // [ႚ..ႜ] Myanmar
| '\u{17b6}' // [ា] Khmer
| '\u{17be}'..'\u{17c5}' // [ើ..ៅ] Khmer
| '\u{17c7}'..'\u{17c8}' // [ះ..ៈ] Khmer
| '\u{1923}'..'\u{1926}' // [ᤣ..ᤦ] Limbu
| '\u{1929}'..'\u{192b}' // [ᤩ..ᤫ] Limbu
| '\u{1930}'..'\u{1931}' // [ᤰ..ᤱ] Limbu
| '\u{1933}'..'\u{1938}' // [ᤳ..ᤸ] Limbu
| '\u{1a19}'..'\u{1a1a}' // [ᨙ..ᨚ] Buginese
| '\u{1a55}' // [ᩕ] Tai Tham
| '\u{1a57}' // [ᩗ] Tai Tham
| '\u{1a61}' // [ᩡ] Tai Tham
| '\u{1a63}'..'\u{1a64}' // [ᩣ..ᩤ] Tai Tham
| '\u{1a6d}'..'\u{1a72}' // [ᩭ..ᩲ] Tai Tham
| '\u{1b04}' // [ᬄ] Balinese
| '\u{1b35}' // [ᬵ] Balinese
| '\u{1b3b}' // [ᬻ] Balinese
| '\u{1b3d}'..'\u{1b41}' // [ᬽ..ᭁ] Balinese
| '\u{1b43}'..'\u{1b44}' // [ᭃ..᭄] Balinese
| '\u{1b82}' // [ᮂ] Sundanese
| '\u{1ba1}' // [ᮡ] Sundanese
| '\u{1ba6}'..'\u{1ba7}' // [ᮦ..ᮧ] Sundanese
| '\u{1baa}' // [᮪] Sundanese
| '\u{1be7}' // [ᯧ] Batak
| '\u{1bea}'..'\u{1bec}' // [ᯪ..ᯬ] Batak
| '\u{1bee}' // [ᯮ] Batak
| '\u{1bf2}'..'\u{1bf3}' // [᯲..᯳] Batak
| '\u{1c24}'..'\u{1c2b}' // [ᰤ..ᰫ] Lepcha
| '\u{1c34}'..'\u{1c35}' // [ᰴ..ᰵ] Lepcha
| '\u{1ce1}' // [᳡] Vedic Extensions
| '\u{1cf2}'..'\u{1cf3}' // [ᳲ..ᳳ] Vedic Extensions
| '\u{302e}'..'\u{302f}' // [〮..〯] CJK Symbols and Punctuation
| '\u{a823}'..'\u{a824}' // [ꠣ..ꠤ] Syloti Nagri
| '\u{a827}' // [ꠧ] Syloti Nagri
| '\u{a880}'..'\u{a881}' // [ꢀ..ꢁ] Saurashtra
| '\u{a8b4}'..'\u{a8c3}' // [ꢴ..ꣃ] Saurashtra
| '\u{a952}'..'\u{a953}' // [ꥒ..꥓] Rejang
| '\u{a983}' // [ꦃ] Javanese
| '\u{a9b4}'..'\u{a9b5}' // [ꦴ..ꦵ] Javanese
| '\u{a9ba}'..'\u{a9bb}' // [ꦺ..ꦻ] Javanese
| '\u{a9bd}'..'\u{a9c0}' // [ꦽ..꧀] Javanese
| '\u{aa2f}'..'\u{aa30}' // [ꨯ..ꨰ] Cham
| '\u{aa33}'..'\u{aa34}' // [ꨳ..ꨴ] Cham
| '\u{aa4d}' // [ꩍ] Cham
| '\u{aa7b}' // [ꩻ] Myanmar Extended-A
| '\u{aa7d}' // [ꩽ] Myanmar Extended-A
| '\u{aaeb}' // [ꫫ] Meetei Mayek Extensions
| '\u{aaee}'..'\u{aaef}' // [ꫮ..ꫯ] Meetei Mayek Extensions
| '\u{aaf5}' // [ꫵ] Meetei Mayek Extensions
| '\u{abe3}'..'\u{abe4}' // [ꯣ..ꯤ] Meetei Mayek
| '\u{abe6}'..'\u{abe7}' // [ꯦ..ꯧ] Meetei Mayek
| '\u{abe9}'..'\u{abea}' // [ꯩ..ꯪ] Meetei Mayek
| '\u{abec}' // [꯬] Meetei Mayek
| '\u{11000}' // [𑀀] Brahmi
| '\u{11002}' // [𑀂] Brahmi
| '\u{11082}' // [𑂂] Kaithi
| '\u{110b0}'..'\u{110b2}' // [𑂰..𑂲] Kaithi
| '\u{110b7}'..'\u{110b8}' // [𑂷..𑂸] Kaithi
| '\u{1112c}' // [𑄬] Chakma
| '\u{11182}' // [𑆂] Sharada
| '\u{111b3}'..'\u{111b5}' // [𑆳..𑆵] Sharada
| '\u{111bf}'..'\u{111c0}' // [𑆿..𑇀] Sharada
| '\u{1122c}'..'\u{1122e}' // [𑈬..𑈮] Khojki
| '\u{11232}'..'\u{11233}' // [𑈲..𑈳] Khojki
| '\u{11235}' // [𑈵] Khojki
| '\u{112e0}'..'\u{112e2}' // [𑋠..𑋢] Khudawadi
| '\u{11302}'..'\u{11303}' // [𑌂..𑌃] Grantha
| '\u{1133e}'..'\u{1133f}' // [𑌾..𑌿] Grantha
| '\u{11341}'..'\u{11344}' // [𑍁..𑍄] Grantha
| '\u{11347}'..'\u{11348}' // [𑍇..𑍈] Grantha
| '\u{1134b}'..'\u{1134d}' // [𑍋..𑍍] Grantha
| '\u{11357}' // [𑍗] Grantha
| '\u{11362}'..'\u{11363}' // [𑍢..𑍣] Grantha
| '\u{11435}'..'\u{11437}' // [𑐵..𑐷] Newa
| '\u{11440}'..'\u{11441}' // [𑑀..𑑁] Newa
| '\u{11445}' // [𑑅] Newa
| '\u{114b0}'..'\u{114b2}' // [𑒰..𑒲] Tirhuta
| '\u{114b9}' // [𑒹] Tirhuta
| '\u{114bb}'..'\u{114be}' // [𑒻..𑒾] Tirhuta
| '\u{114c1}' // [𑓁] Tirhuta
| '\u{115af}'..'\u{115b1}' // [𑖯..𑖱] Siddham
| '\u{115b8}'..'\u{115bb}' // [𑖸..𑖻] Siddham
| '\u{115be}' // [𑖾] Siddham
| '\u{11630}'..'\u{11632}' // [𑘰..𑘲] Modi
| '\u{1163b}'..'\u{1163c}' // [𑘻..𑘼] Modi
| '\u{1163e}' // [𑘾] Modi
| '\u{116ac}' // [𑚬] Takri
| '\u{116ae}'..'\u{116af}' // [𑚮..𑚯] Takri
| '\u{116b6}' // [𑚶] Takri
| '\u{11720}'..'\u{11721}' // [𑜠..𑜡] Ahom
| '\u{11726}' // [𑜦] Ahom
| '\u{11c2f}' // [𑰯] Bhaiksuki
| '\u{11c3e}' // [𑰾] Bhaiksuki
| '\u{11ca9}' // [𑲩] Marchen
| '\u{11cb1}' // [𑲱] Marchen
| '\u{11cb4}' // [𑲴] Marchen
| '\u{16f51}'..'\u{16f7e}' // [𖽑..𖽾] Miao
| '\u{1d165}'..'\u{1d166}' // [𝅥..𝅦] Musical Symbols
| '\u{1d16d}'..'\u{1d172}' // [𝅭..𝅲] Musical Symbols
;
// CLASSIFY_Me matches exactly one code point whose General_Category is
// Me (Enclosing_Mark) in the Unicode 9.0.0 data this grammar is generated from.
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the first/last glyph and the Unicode block name.
CLASSIFY_Me: // Enclosing_Mark
  '\u{0488}'..'\u{0489}' // [҈..҉] Cyrillic
| '\u{1abe}' // [᪾] Combining Diacritical Marks Extended
| '\u{20dd}'..'\u{20e0}' // [⃝..⃠] Combining Diacritical Marks for Symbols
| '\u{20e2}'..'\u{20e4}' // [⃢..⃤] Combining Diacritical Marks for Symbols
| '\u{a670}'..'\u{a672}' // [꙰..꙲] Cyrillic Extended-B
;
// CLASSIFY_Mn matches exactly one code point whose General_Category is
// Mn (Nonspacing_Mark) in the Unicode 9.0.0 data this grammar is generated from.
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the first/last glyph and the Unicode block name(s).
// Ranges are split wherever Unicode 9.0.0 leaves a code point unassigned, so
// the rule never classifies an unassigned code point as a nonspacing mark.
// A range may still cross a block boundary when every code point in it is an
// assigned Mn character (e.g. 08E3..0902).
CLASSIFY_Mn: // Nonspacing_Mark
  '\u{0300}'..'\u{036f}' // [̀..ͯ] Combining Diacritical Marks
| '\u{0483}'..'\u{0487}' // [҃..҇] Cyrillic
| '\u{0591}'..'\u{05bd}' // [֑..ֽ] Hebrew
| '\u{05bf}' // [ֿ] Hebrew
| '\u{05c1}'..'\u{05c2}' // [ׁ..ׂ] Hebrew
| '\u{05c4}'..'\u{05c5}' // [ׄ..ׅ] Hebrew
| '\u{05c7}' // [ׇ] Hebrew
| '\u{0610}'..'\u{061a}' // [ؐ..ؚ] Arabic
| '\u{064b}'..'\u{065f}' // [ً..ٟ] Arabic
| '\u{0670}' // [ٰ] Arabic
| '\u{06d6}'..'\u{06dc}' // [ۖ..ۜ] Arabic
| '\u{06df}'..'\u{06e4}' // [۟..ۤ] Arabic
| '\u{06e7}'..'\u{06e8}' // [ۧ..ۨ] Arabic
| '\u{06ea}'..'\u{06ed}' // [۪..ۭ] Arabic
| '\u{0711}' // [ܑ] Syriac
| '\u{0730}'..'\u{074a}' // [ܰ..݊] Syriac
| '\u{07a6}'..'\u{07b0}' // [ަ..ް] Thaana
| '\u{07eb}'..'\u{07f3}' // [߫..߳] NKo
| '\u{0816}'..'\u{0819}' // [ࠖ..࠙] Samaritan
| '\u{081b}'..'\u{0823}' // [ࠛ..ࠣ] Samaritan
| '\u{0825}'..'\u{0827}' // [ࠥ..ࠧ] Samaritan
| '\u{0829}'..'\u{082d}' // [ࠩ..࠭] Samaritan
| '\u{0859}'..'\u{085b}' // [࡙..࡛] Mandaic
| '\u{08d4}'..'\u{08e1}' // [ࣔ..࣡] Arabic Extended-A
| '\u{08e3}'..'\u{0902}' // [ࣣ..ं] Arabic Extended-A, Devanagari
| '\u{093a}' // [ऺ] Devanagari
| '\u{093c}' // [़] Devanagari
| '\u{0941}'..'\u{0948}' // [ु..ै] Devanagari
| '\u{094d}' // [्] Devanagari
| '\u{0951}'..'\u{0957}' // [॑..ॗ] Devanagari
| '\u{0962}'..'\u{0963}' // [ॢ..ॣ] Devanagari
| '\u{0981}' // [ঁ] Bengali
| '\u{09bc}' // [়] Bengali
| '\u{09c1}'..'\u{09c4}' // [ু..ৄ] Bengali
| '\u{09cd}' // [্] Bengali
| '\u{09e2}'..'\u{09e3}' // [ৢ..ৣ] Bengali
| '\u{0a01}'..'\u{0a02}' // [ਁ..ਂ] Gurmukhi
| '\u{0a3c}' // [਼] Gurmukhi
| '\u{0a41}'..'\u{0a42}' // [ੁ..ੂ] Gurmukhi
| '\u{0a47}'..'\u{0a48}' // [ੇ..ੈ] Gurmukhi
| '\u{0a4b}'..'\u{0a4d}' // [ੋ..੍] Gurmukhi
| '\u{0a51}' // [ੑ] Gurmukhi
| '\u{0a70}'..'\u{0a71}' // [ੰ..ੱ] Gurmukhi
| '\u{0a75}' // [ੵ] Gurmukhi
| '\u{0a81}'..'\u{0a82}' // [ઁ..ં] Gujarati
| '\u{0abc}' // [઼] Gujarati
| '\u{0ac1}'..'\u{0ac5}' // [ુ..ૅ] Gujarati
| '\u{0ac7}'..'\u{0ac8}' // [ે..ૈ] Gujarati
| '\u{0acd}' // [્] Gujarati
| '\u{0ae2}'..'\u{0ae3}' // [ૢ..ૣ] Gujarati
| '\u{0b01}' // [ଁ] Oriya
| '\u{0b3c}' // [଼] Oriya
| '\u{0b3f}' // [ି] Oriya
| '\u{0b41}'..'\u{0b44}' // [ୁ..ୄ] Oriya
| '\u{0b4d}' // [୍] Oriya
| '\u{0b56}' // [ୖ] Oriya
| '\u{0b62}'..'\u{0b63}' // [ୢ..ୣ] Oriya
| '\u{0b82}' // [ஂ] Tamil
| '\u{0bc0}' // [ீ] Tamil
| '\u{0bcd}' // [்] Tamil
| '\u{0c00}' // [ఀ] Telugu
| '\u{0c3e}'..'\u{0c40}' // [ా..ీ] Telugu
| '\u{0c46}'..'\u{0c48}' // [ె..ై] Telugu
| '\u{0c4a}'..'\u{0c4d}' // [ొ..్] Telugu
| '\u{0c55}'..'\u{0c56}' // [ౕ..ౖ] Telugu
| '\u{0c62}'..'\u{0c63}' // [ౢ..ౣ] Telugu
| '\u{0c81}' // [ಁ] Kannada
| '\u{0cbc}' // [಼] Kannada
| '\u{0cbf}' // [ಿ] Kannada
| '\u{0cc6}' // [ೆ] Kannada
| '\u{0ccc}'..'\u{0ccd}' // [ೌ..್] Kannada
| '\u{0ce2}'..'\u{0ce3}' // [ೢ..ೣ] Kannada
| '\u{0d01}' // [ഁ] Malayalam
| '\u{0d41}'..'\u{0d44}' // [ു..ൄ] Malayalam
| '\u{0d4d}' // [്] Malayalam
| '\u{0d62}'..'\u{0d63}' // [ൢ..ൣ] Malayalam
| '\u{0dca}' // [්] Sinhala
| '\u{0dd2}'..'\u{0dd4}' // [ි..ු] Sinhala
| '\u{0dd6}' // [ූ] Sinhala
| '\u{0e31}' // [ั] Thai
| '\u{0e34}'..'\u{0e3a}' // [ิ..ฺ] Thai
| '\u{0e47}'..'\u{0e4e}' // [็..๎] Thai
| '\u{0eb1}' // [ັ] Lao
| '\u{0eb4}'..'\u{0eb9}' // [ິ..ູ] Lao
| '\u{0ebb}'..'\u{0ebc}' // [ົ..ຼ] Lao
| '\u{0ec8}'..'\u{0ecd}' // [່..ໍ] Lao
| '\u{0f18}'..'\u{0f19}' // [༘..༙] Tibetan
| '\u{0f35}' // [༵] Tibetan
| '\u{0f37}' // [༷] Tibetan
| '\u{0f39}' // [༹] Tibetan
| '\u{0f71}'..'\u{0f7e}' // [ཱ..ཾ] Tibetan
| '\u{0f80}'..'\u{0f84}' // [ྀ..྄] Tibetan
| '\u{0f86}'..'\u{0f87}' // [྆..྇] Tibetan
| '\u{0f8d}'..'\u{0f97}' // [ྍ..ྗ] Tibetan
| '\u{0f99}'..'\u{0fbc}' // [ྙ..ྼ] Tibetan
| '\u{0fc6}' // [࿆] Tibetan
| '\u{102d}'..'\u{1030}' // [ိ..ူ] Myanmar
| '\u{1032}'..'\u{1037}' // [ဲ..့] Myanmar
| '\u{1039}'..'\u{103a}' // [္..်] Myanmar
| '\u{103d}'..'\u{103e}' // [ွ..ှ] Myanmar
| '\u{1058}'..'\u{1059}' // [ၘ..ၙ] Myanmar
| '\u{105e}'..'\u{1060}' // [ၞ..ၠ] Myanmar
| '\u{1071}'..'\u{1074}' // [ၱ..ၴ] Myanmar
| '\u{1082}' // [ႂ] Myanmar
| '\u{1085}'..'\u{1086}' // [ႅ..ႆ] Myanmar
| '\u{108d}' // [ႍ] Myanmar
| '\u{109d}' // [ႝ] Myanmar
| '\u{135d}'..'\u{135f}' // [፝..፟] Ethiopic
| '\u{1712}'..'\u{1714}' // [ᜒ..᜔] Tagalog
| '\u{1732}'..'\u{1734}' // [ᜲ..᜴] Hanunoo
| '\u{1752}'..'\u{1753}' // [ᝒ..ᝓ] Buhid
| '\u{1772}'..'\u{1773}' // [ᝲ..ᝳ] Tagbanwa
| '\u{17b4}'..'\u{17b5}' // [឴..឵] Khmer
| '\u{17b7}'..'\u{17bd}' // [ិ..ួ] Khmer
| '\u{17c6}' // [ំ] Khmer
| '\u{17c9}'..'\u{17d3}' // [៉..៓] Khmer
| '\u{17dd}' // [៝] Khmer
| '\u{180b}'..'\u{180d}' // [᠋..᠍] Mongolian
| '\u{1885}'..'\u{1886}' // [ᢅ..ᢆ] Mongolian
| '\u{18a9}' // [ᢩ] Mongolian
| '\u{1920}'..'\u{1922}' // [ᤠ..ᤢ] Limbu
| '\u{1927}'..'\u{1928}' // [ᤧ..ᤨ] Limbu
| '\u{1932}' // [ᤲ] Limbu
| '\u{1939}'..'\u{193b}' // [᤹..᤻] Limbu
| '\u{1a17}'..'\u{1a18}' // [ᨗ..ᨘ] Buginese
| '\u{1a1b}' // [ᨛ] Buginese
| '\u{1a56}' // [ᩖ] Tai Tham
| '\u{1a58}'..'\u{1a5e}' // [ᩘ..ᩞ] Tai Tham
| '\u{1a60}' // [᩠] Tai Tham
| '\u{1a62}' // [ᩢ] Tai Tham
| '\u{1a65}'..'\u{1a6c}' // [ᩥ..ᩬ] Tai Tham
| '\u{1a73}'..'\u{1a7c}' // [ᩳ..᩼] Tai Tham
| '\u{1a7f}' // [᩿] Tai Tham
| '\u{1ab0}'..'\u{1abd}' // [᪰..᪽] Combining Diacritical Marks Extended
| '\u{1b00}'..'\u{1b03}' // [ᬀ..ᬃ] Balinese
| '\u{1b34}' // [᬴] Balinese
| '\u{1b36}'..'\u{1b3a}' // [ᬶ..ᬺ] Balinese
| '\u{1b3c}' // [ᬼ] Balinese
| '\u{1b42}' // [ᭂ] Balinese
| '\u{1b6b}'..'\u{1b73}' // [᭫..᭳] Balinese
| '\u{1b80}'..'\u{1b81}' // [ᮀ..ᮁ] Sundanese
| '\u{1ba2}'..'\u{1ba5}' // [ᮢ..ᮥ] Sundanese
| '\u{1ba8}'..'\u{1ba9}' // [ᮨ..ᮩ] Sundanese
| '\u{1bab}'..'\u{1bad}' // [᮫..ᮭ] Sundanese
| '\u{1be6}' // [᯦] Batak
| '\u{1be8}'..'\u{1be9}' // [ᯨ..ᯩ] Batak
| '\u{1bed}' // [ᯭ] Batak
| '\u{1bef}'..'\u{1bf1}' // [ᯯ..ᯱ] Batak
| '\u{1c2c}'..'\u{1c33}' // [ᰬ..ᰳ] Lepcha
| '\u{1c36}'..'\u{1c37}' // [ᰶ..᰷] Lepcha
| '\u{1cd0}'..'\u{1cd2}' // [᳐..᳒] Vedic Extensions
| '\u{1cd4}'..'\u{1ce0}' // [᳔..᳠] Vedic Extensions
| '\u{1ce2}'..'\u{1ce8}' // [᳢..᳨] Vedic Extensions
| '\u{1ced}' // [᳭] Vedic Extensions
| '\u{1cf4}' // [᳴] Vedic Extensions
| '\u{1cf8}'..'\u{1cf9}' // [᳸..᳹] Vedic Extensions
| '\u{1dc0}'..'\u{1df5}' // [᷀..᷵] Combining Diacritical Marks Supplement
| '\u{1dfb}'..'\u{1dff}' // [᷻..᷿] Combining Diacritical Marks Supplement
| '\u{20d0}'..'\u{20dc}' // [⃐..⃜] Combining Diacritical Marks for Symbols
| '\u{20e1}' // [⃡] Combining Diacritical Marks for Symbols
| '\u{20e5}'..'\u{20f0}' // [⃥..⃰] Combining Diacritical Marks for Symbols
| '\u{2cef}'..'\u{2cf1}' // [⳯..⳱] Coptic
| '\u{2d7f}' // [⵿] Tifinagh
| '\u{2de0}'..'\u{2dff}' // [ⷠ..ⷿ] Cyrillic Extended-A
| '\u{302a}'..'\u{302d}' // [〪..〭] CJK Symbols and Punctuation
| '\u{3099}'..'\u{309a}' // [゙..゚] Hiragana
| '\u{a66f}' // [꙯] Cyrillic Extended-B
| '\u{a674}'..'\u{a67d}' // [ꙴ..꙽] Cyrillic Extended-B
| '\u{a69e}'..'\u{a69f}' // [ꚞ..ꚟ] Cyrillic Extended-B
| '\u{a6f0}'..'\u{a6f1}' // [꛰..꛱] Bamum
| '\u{a802}' // [ꠂ] Syloti Nagri
| '\u{a806}' // [꠆] Syloti Nagri
| '\u{a80b}' // [ꠋ] Syloti Nagri
| '\u{a825}'..'\u{a826}' // [ꠥ..ꠦ] Syloti Nagri
| '\u{a8c4}'..'\u{a8c5}' // [꣄..ꣅ] Saurashtra
| '\u{a8e0}'..'\u{a8f1}' // [꣠..꣱] Devanagari Extended
| '\u{a926}'..'\u{a92d}' // [ꤦ..꤭] Kayah Li
| '\u{a947}'..'\u{a951}' // [ꥇ..ꥑ] Rejang
| '\u{a980}'..'\u{a982}' // [ꦀ..ꦂ] Javanese
| '\u{a9b3}' // [꦳] Javanese
| '\u{a9b6}'..'\u{a9b9}' // [ꦶ..ꦹ] Javanese
| '\u{a9bc}' // [ꦼ] Javanese
| '\u{a9e5}' // [ꧥ] Myanmar Extended-B
| '\u{aa29}'..'\u{aa2e}' // [ꨩ..ꨮ] Cham
| '\u{aa31}'..'\u{aa32}' // [ꨱ..ꨲ] Cham
| '\u{aa35}'..'\u{aa36}' // [ꨵ..ꨶ] Cham
| '\u{aa43}' // [ꩃ] Cham
| '\u{aa4c}' // [ꩌ] Cham
| '\u{aa7c}' // [ꩼ] Myanmar Extended-A
| '\u{aab0}' // [ꪰ] Tai Viet
| '\u{aab2}'..'\u{aab4}' // [ꪲ..ꪴ] Tai Viet
| '\u{aab7}'..'\u{aab8}' // [ꪷ..ꪸ] Tai Viet
| '\u{aabe}'..'\u{aabf}' // [ꪾ..꪿] Tai Viet
| '\u{aac1}' // [꫁] Tai Viet
| '\u{aaec}'..'\u{aaed}' // [ꫬ..ꫭ] Meetei Mayek Extensions
| '\u{aaf6}' // [꫶] Meetei Mayek Extensions
| '\u{abe5}' // [ꯥ] Meetei Mayek
| '\u{abe8}' // [ꯨ] Meetei Mayek
| '\u{abed}' // [꯭] Meetei Mayek
| '\u{fb1e}' // [ﬞ] Alphabetic Presentation Forms
| '\u{fe00}'..'\u{fe0f}' // [︀..️] Variation Selectors
| '\u{fe20}'..'\u{fe2f}' // [︠..︯] Combining Half Marks
| '\u{101fd}' // [𐇽] Phaistos Disc
| '\u{102e0}' // [𐋠] Coptic Epact Numbers
| '\u{10376}'..'\u{1037a}' // [𐍶..𐍺] Old Permic
| '\u{10a01}'..'\u{10a03}' // [𐨁..𐨃] Kharoshthi
| '\u{10a05}'..'\u{10a06}' // [𐨅..𐨆] Kharoshthi
| '\u{10a0c}'..'\u{10a0f}' // [𐨌..𐨏] Kharoshthi
| '\u{10a38}'..'\u{10a3a}' // [𐨸..𐨺] Kharoshthi
| '\u{10a3f}' // [𐨿] Kharoshthi
| '\u{10ae5}'..'\u{10ae6}' // [𐫥..𐫦] Manichaean
| '\u{11001}' // [𑀁] Brahmi
| '\u{11038}'..'\u{11046}' // [𑀸..𑁆] Brahmi
| '\u{1107f}'..'\u{11081}' // [𑁿..𑂁] Brahmi, Kaithi
| '\u{110b3}'..'\u{110b6}' // [𑂳..𑂶] Kaithi
| '\u{110b9}'..'\u{110ba}' // [𑂹..𑂺] Kaithi
| '\u{11100}'..'\u{11102}' // [𑄀..𑄂] Chakma
| '\u{11127}'..'\u{1112b}' // [𑄧..𑄫] Chakma
| '\u{1112d}'..'\u{11134}' // [𑄭..𑄴] Chakma
| '\u{11173}' // [𑅳] Mahajani
| '\u{11180}'..'\u{11181}' // [𑆀..𑆁] Sharada
| '\u{111b6}'..'\u{111be}' // [𑆶..𑆾] Sharada
| '\u{111ca}'..'\u{111cc}' // [𑇊..𑇌] Sharada
| '\u{1122f}'..'\u{11231}' // [𑈯..𑈱] Khojki
| '\u{11234}' // [𑈴] Khojki
| '\u{11236}'..'\u{11237}' // [𑈶..𑈷] Khojki
| '\u{1123e}' // [𑈾] Khojki
| '\u{112df}' // [𑋟] Khudawadi
| '\u{112e3}'..'\u{112ea}' // [𑋣..𑋪] Khudawadi
| '\u{11300}'..'\u{11301}' // [𑌀..𑌁] Grantha
| '\u{1133c}' // [𑌼] Grantha
| '\u{11340}' // [𑍀] Grantha
| '\u{11366}'..'\u{1136c}' // [𑍦..𑍬] Grantha
| '\u{11370}'..'\u{11374}' // [𑍰..𑍴] Grantha
| '\u{11438}'..'\u{1143f}' // [𑐸..𑐿] Newa
| '\u{11442}'..'\u{11444}' // [𑑂..𑑄] Newa
| '\u{11446}' // [𑑆] Newa
| '\u{114b3}'..'\u{114b8}' // [𑒳..𑒸] Tirhuta
| '\u{114ba}' // [𑒺] Tirhuta
| '\u{114bf}'..'\u{114c0}' // [𑒿..𑓀] Tirhuta
| '\u{114c2}'..'\u{114c3}' // [𑓂..𑓃] Tirhuta
| '\u{115b2}'..'\u{115b5}' // [𑖲..𑖵] Siddham
| '\u{115bc}'..'\u{115bd}' // [𑖼..𑖽] Siddham
| '\u{115bf}'..'\u{115c0}' // [𑖿..𑗀] Siddham
| '\u{115dc}'..'\u{115dd}' // [𑗜..𑗝] Siddham
| '\u{11633}'..'\u{1163a}' // [𑘳..𑘺] Modi
| '\u{1163d}' // [𑘽] Modi
| '\u{1163f}'..'\u{11640}' // [𑘿..𑙀] Modi
| '\u{116ab}' // [𑚫] Takri
| '\u{116ad}' // [𑚭] Takri
| '\u{116b0}'..'\u{116b5}' // [𑚰..𑚵] Takri
| '\u{116b7}' // [𑚷] Takri
| '\u{1171d}'..'\u{1171f}' // [𑜝..𑜟] Ahom
| '\u{11722}'..'\u{11725}' // [𑜢..𑜥] Ahom
| '\u{11727}'..'\u{1172b}' // [𑜧..𑜫] Ahom
| '\u{11c30}'..'\u{11c36}' // [𑰰..𑰶] Bhaiksuki
| '\u{11c38}'..'\u{11c3d}' // [𑰸..𑰽] Bhaiksuki
| '\u{11c3f}' // [𑰿] Bhaiksuki
| '\u{11c92}'..'\u{11ca7}' // [𑲒..𑲧] Marchen
| '\u{11caa}'..'\u{11cb0}' // [𑲪..𑲰] Marchen
| '\u{11cb2}'..'\u{11cb3}' // [𑲲..𑲳] Marchen
| '\u{11cb5}'..'\u{11cb6}' // [𑲵..𑲶] Marchen
| '\u{16af0}'..'\u{16af4}' // [𖫰..𖫴] Bassa Vah
| '\u{16b30}'..'\u{16b36}' // [𖬰..𖬶] Pahawh Hmong
| '\u{16f8f}'..'\u{16f92}' // [𖾏..𖾒] Miao
| '\u{1bc9d}'..'\u{1bc9e}' // [𛲝..𛲞] Duployan
| '\u{1d167}'..'\u{1d169}' // [𝅧..𝅩] Musical Symbols
| '\u{1d17b}'..'\u{1d182}' // [𝅻..𝆂] Musical Symbols
| '\u{1d185}'..'\u{1d18b}' // [𝆅..𝆋] Musical Symbols
| '\u{1d1aa}'..'\u{1d1ad}' // [𝆪..𝆭] Musical Symbols
| '\u{1d242}'..'\u{1d244}' // [𝉂..𝉄] Ancient Greek Musical Notation
| '\u{1da00}'..'\u{1da36}' // [𝨀..𝨶] Sutton SignWriting
| '\u{1da3b}'..'\u{1da6c}' // [𝨻..𝩬] Sutton SignWriting
| '\u{1da75}' // [𝩵] Sutton SignWriting
| '\u{1da84}' // [𝪄] Sutton SignWriting
| '\u{1da9b}'..'\u{1da9f}' // [𝪛..𝪟] Sutton SignWriting
| '\u{1daa1}'..'\u{1daaf}' // [𝪡..𝪯] Sutton SignWriting
| '\u{1e000}'..'\u{1e006}' // [𞀀..𞀆] Glagolitic Supplement
| '\u{1e008}'..'\u{1e018}' // [𞀈..𞀘] Glagolitic Supplement
| '\u{1e01b}'..'\u{1e021}' // [𞀛..𞀡] Glagolitic Supplement
| '\u{1e023}'..'\u{1e024}' // [𞀣..𞀤] Glagolitic Supplement
| '\u{1e026}'..'\u{1e02a}' // [𞀦..𞀪] Glagolitic Supplement
| '\u{1e8d0}'..'\u{1e8d6}' // [𞣐..𞣖] Mende Kikakui
| '\u{1e944}'..'\u{1e94a}' // [𞥄..𞥊] Adlam
| '\u{e0100}'..'\u{e01ef}' // [󠄀..󠇯] Variation Selectors Supplement
;
// CLASSIFY_Nd matches exactly one code point whose General_Category is
// Nd (Decimal_Number; this grammar labels it "digit") in the Unicode 9.0.0
// data this grammar is generated from.
// Each alternative is an inclusive range; the trailing comment shows the
// first/last glyph and the Unicode block name.
// The two Tai Tham digit runs are listed separately because 1A8A..1A8F are
// unassigned in Unicode 9.0.0 and must not be classified as digits.
CLASSIFY_Nd: // digit
  '\u{0030}'..'\u{0039}' // [0..9] Basic Latin
| '\u{0660}'..'\u{0669}' // [٠..٩] Arabic
| '\u{06f0}'..'\u{06f9}' // [۰..۹] Arabic
| '\u{07c0}'..'\u{07c9}' // [߀..߉] NKo
| '\u{0966}'..'\u{096f}' // [०..९] Devanagari
| '\u{09e6}'..'\u{09ef}' // [০..৯] Bengali
| '\u{0a66}'..'\u{0a6f}' // [੦..੯] Gurmukhi
| '\u{0ae6}'..'\u{0aef}' // [૦..૯] Gujarati
| '\u{0b66}'..'\u{0b6f}' // [୦..୯] Oriya
| '\u{0be6}'..'\u{0bef}' // [௦..௯] Tamil
| '\u{0c66}'..'\u{0c6f}' // [౦..౯] Telugu
| '\u{0ce6}'..'\u{0cef}' // [೦..೯] Kannada
| '\u{0d66}'..'\u{0d6f}' // [൦..൯] Malayalam
| '\u{0de6}'..'\u{0def}' // [෦..෯] Sinhala
| '\u{0e50}'..'\u{0e59}' // [๐..๙] Thai
| '\u{0ed0}'..'\u{0ed9}' // [໐..໙] Lao
| '\u{0f20}'..'\u{0f29}' // [༠..༩] Tibetan
| '\u{1040}'..'\u{1049}' // [၀..၉] Myanmar
| '\u{1090}'..'\u{1099}' // [႐..႙] Myanmar
| '\u{17e0}'..'\u{17e9}' // [០..៩] Khmer
| '\u{1810}'..'\u{1819}' // [᠐..᠙] Mongolian
| '\u{1946}'..'\u{194f}' // [᥆..᥏] Limbu
| '\u{19d0}'..'\u{19d9}' // [᧐..᧙] New Tai Lue
| '\u{1a80}'..'\u{1a89}' // [᪀..᪉] Tai Tham
| '\u{1a90}'..'\u{1a99}' // [᪐..᪙] Tai Tham
| '\u{1b50}'..'\u{1b59}' // [᭐..᭙] Balinese
| '\u{1bb0}'..'\u{1bb9}' // [᮰..᮹] Sundanese
| '\u{1c40}'..'\u{1c49}' // [᱀..᱉] Lepcha
| '\u{1c50}'..'\u{1c59}' // [᱐..᱙] Ol Chiki
| '\u{a620}'..'\u{a629}' // [꘠..꘩] Vai
| '\u{a8d0}'..'\u{a8d9}' // [꣐..꣙] Saurashtra
| '\u{a900}'..'\u{a909}' // [꤀..꤉] Kayah Li
| '\u{a9d0}'..'\u{a9d9}' // [꧐..꧙] Javanese
| '\u{a9f0}'..'\u{a9f9}' // [꧰..꧹] Myanmar Extended-B
| '\u{aa50}'..'\u{aa59}' // [꩐..꩙] Cham
| '\u{abf0}'..'\u{abf9}' // [꯰..꯹] Meetei Mayek
| '\u{ff10}'..'\u{ff19}' // [０..９] Halfwidth and Fullwidth Forms
| '\u{104a0}'..'\u{104a9}' // [𐒠..𐒩] Osmanya
| '\u{11066}'..'\u{1106f}' // [𑁦..𑁯] Brahmi
| '\u{110f0}'..'\u{110f9}' // [𑃰..𑃹] Sora Sompeng
| '\u{11136}'..'\u{1113f}' // [𑄶..𑄿] Chakma
| '\u{111d0}'..'\u{111d9}' // [𑇐..𑇙] Sharada
| '\u{112f0}'..'\u{112f9}' // [𑋰..𑋹] Khudawadi
| '\u{11450}'..'\u{11459}' // [𑑐..𑑙] Newa
| '\u{114d0}'..'\u{114d9}' // [𑓐..𑓙] Tirhuta
| '\u{11650}'..'\u{11659}' // [𑙐..𑙙] Modi
| '\u{116c0}'..'\u{116c9}' // [𑛀..𑛉] Takri
| '\u{11730}'..'\u{11739}' // [𑜰..𑜹] Ahom
| '\u{118e0}'..'\u{118e9}' // [𑣠..𑣩] Warang Citi
| '\u{11c50}'..'\u{11c59}' // [𑱐..𑱙] Bhaiksuki
| '\u{16a60}'..'\u{16a69}' // [𖩠..𖩩] Mro
| '\u{16b50}'..'\u{16b59}' // [𖭐..𖭙] Pahawh Hmong
| '\u{1d7ce}'..'\u{1d7ff}' // [𝟎..𝟿] Mathematical Alphanumeric Symbols
| '\u{1e950}'..'\u{1e959}' // [𞥐..𞥙] Adlam
;
// CLASSIFY_Nl matches exactly one code point whose General_Category is
// Nl (Letter_Number) in the Unicode 9.0.0 data this grammar is generated from.
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the first/last glyph and the Unicode block name.
CLASSIFY_Nl: // Letter_Number
  '\u{16ee}'..'\u{16f0}' // [ᛮ..ᛰ] Runic
| '\u{2160}'..'\u{2182}' // [Ⅰ..ↂ] Number Forms
| '\u{2185}'..'\u{2188}' // [ↅ..ↈ] Number Forms
| '\u{3007}' // [〇] CJK Symbols and Punctuation
| '\u{3021}'..'\u{3029}' // [〡..〩] CJK Symbols and Punctuation
| '\u{3038}'..'\u{303a}' // [〸..〺] CJK Symbols and Punctuation
| '\u{a6e6}'..'\u{a6ef}' // [ꛦ..ꛯ] Bamum
| '\u{10140}'..'\u{10174}' // [𐅀..𐅴] Ancient Greek Numbers
| '\u{10341}' // [𐍁] Gothic
| '\u{1034a}' // [𐍊] Gothic
| '\u{103d1}'..'\u{103d5}' // [𐏑..𐏕] Old Persian
| '\u{12400}'..'\u{1246e}' // [𒐀..𒑮] Cuneiform Numbers and Punctuation
;
// CLASSIFY_No matches exactly one code point whose General_Category is
// No (Other_Number) in the Unicode 9.0.0 data this grammar is generated from.
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the first/last glyph and the Unicode block name.
// Ranges are split wherever Unicode 9.0.0 leaves a code point unassigned:
// 109D0..109D1 inside Meroitic Cursive, and the 10D00..10E5F gap between the
// Old Hungarian numbers and the Rumi Numeral Symbols.
CLASSIFY_No: // Other_Number
  '\u{00b2}'..'\u{00b3}' // [²..³] Latin-1 Supplement
| '\u{00b9}' // [¹] Latin-1 Supplement
| '\u{00bc}'..'\u{00be}' // [¼..¾] Latin-1 Supplement
| '\u{09f4}'..'\u{09f9}' // [৴..৹] Bengali
| '\u{0b72}'..'\u{0b77}' // [୲..୷] Oriya
| '\u{0bf0}'..'\u{0bf2}' // [௰..௲] Tamil
| '\u{0c78}'..'\u{0c7e}' // [౸..౾] Telugu
| '\u{0d58}'..'\u{0d5e}' // [൘..൞] Malayalam
| '\u{0d70}'..'\u{0d78}' // [൰..൸] Malayalam
| '\u{0f2a}'..'\u{0f33}' // [༪..༳] Tibetan
| '\u{1369}'..'\u{137c}' // [፩..፼] Ethiopic
| '\u{17f0}'..'\u{17f9}' // [៰..៹] Khmer
| '\u{19da}' // [᧚] New Tai Lue
| '\u{2070}' // [⁰] Superscripts and Subscripts
| '\u{2074}'..'\u{2079}' // [⁴..⁹] Superscripts and Subscripts
| '\u{2080}'..'\u{2089}' // [₀..₉] Superscripts and Subscripts
| '\u{2150}'..'\u{215f}' // [⅐..⅟] Number Forms
| '\u{2189}' // [↉] Number Forms
| '\u{2460}'..'\u{249b}' // [①..⒛] Enclosed Alphanumerics
| '\u{24ea}'..'\u{24ff}' // [⓪..⓿] Enclosed Alphanumerics
| '\u{2776}'..'\u{2793}' // [❶..➓] Dingbats
| '\u{2cfd}' // [⳽] Coptic
| '\u{3192}'..'\u{3195}' // [㆒..㆕] Kanbun
| '\u{3220}'..'\u{3229}' // [㈠..㈩] Enclosed CJK Letters and Months
| '\u{3248}'..'\u{324f}' // [㉈..㉏] Enclosed CJK Letters and Months
| '\u{3251}'..'\u{325f}' // [㉑..㉟] Enclosed CJK Letters and Months
| '\u{3280}'..'\u{3289}' // [㊀..㊉] Enclosed CJK Letters and Months
| '\u{32b1}'..'\u{32bf}' // [㊱..㊿] Enclosed CJK Letters and Months
| '\u{a830}'..'\u{a835}' // [꠰..꠵] Common Indic Number Forms
| '\u{10107}'..'\u{10133}' // [𐄇..𐄳] Aegean Numbers
| '\u{10175}'..'\u{10178}' // [𐅵..𐅸] Ancient Greek Numbers
| '\u{1018a}'..'\u{1018b}' // [𐆊..𐆋] Ancient Greek Numbers
| '\u{102e1}'..'\u{102fb}' // [𐋡..𐋻] Coptic Epact Numbers
| '\u{10320}'..'\u{10323}' // [𐌠..𐌣] Old Italic
| '\u{10858}'..'\u{1085f}' // [𐡘..𐡟] Imperial Aramaic
| '\u{10879}'..'\u{1087f}' // [𐡹..𐡿] Palmyrene
| '\u{108a7}'..'\u{108af}' // [𐢧..𐢯] Nabataean
| '\u{108fb}'..'\u{108ff}' // [𐣻..𐣿] Hatran
| '\u{10916}'..'\u{1091b}' // [𐤖..𐤛] Phoenician
| '\u{109bc}'..'\u{109bd}' // [𐦼..𐦽] Meroitic Cursive
| '\u{109c0}'..'\u{109cf}' // [𐧀..𐧏] Meroitic Cursive
| '\u{109d2}'..'\u{109ff}' // [𐧒..𐧿] Meroitic Cursive
| '\u{10a40}'..'\u{10a47}' // [𐩀..𐩇] Kharoshthi
| '\u{10a7d}'..'\u{10a7e}' // [𐩽..𐩾] Old South Arabian
| '\u{10a9d}'..'\u{10a9f}' // [𐪝..𐪟] Old North Arabian
| '\u{10aeb}'..'\u{10aef}' // [𐫫..𐫯] Manichaean
| '\u{10b58}'..'\u{10b5f}' // [𐭘..𐭟] Inscriptional Parthian
| '\u{10b78}'..'\u{10b7f}' // [𐭸..𐭿] Inscriptional Pahlavi
| '\u{10ba9}'..'\u{10baf}' // [𐮩..𐮯] Psalter Pahlavi
| '\u{10cfa}'..'\u{10cff}' // [𐳺..𐳿] Old Hungarian
| '\u{10e60}'..'\u{10e7e}' // [𐹠..𐹾] Rumi Numeral Symbols
| '\u{11052}'..'\u{11065}' // [𑁒..𑁥] Brahmi
| '\u{111e1}'..'\u{111f4}' // [𑇡..𑇴] Sinhala Archaic Numbers
| '\u{1173a}'..'\u{1173b}' // [𑜺..𑜻] Ahom
| '\u{118ea}'..'\u{118f2}' // [𑣪..𑣲] Warang Citi
| '\u{11c5a}'..'\u{11c6c}' // [𑱚..𑱬] Bhaiksuki
| '\u{16b5b}'..'\u{16b61}' // [𖭛..𖭡] Pahawh Hmong
| '\u{1d360}'..'\u{1d371}' // [𝍠..𝍱] Counting Rod Numerals
| '\u{1e8c7}'..'\u{1e8cf}' // [𞣇..𞣏] Mende Kikakui
| '\u{1f100}'..'\u{1f10c}' // [🄀..🄌] Enclosed Alphanumeric Supplement
;
// Token for Unicode general category Pc (Connector_Punctuation).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) and a Unicode block name.
CLASSIFY_Pc: // Connector_Punctuation
    '\u{005f}' // [_] Basic Latin
    | '\u{203f}'..'\u{2040}' // [‿..⁀] General Punctuation
    | '\u{2054}' // [⁔] General Punctuation
    | '\u{fe33}'..'\u{fe34}' // [︳..︴] CJK Compatibility Forms
    | '\u{fe4d}'..'\u{fe4f}' // [﹍..﹏] CJK Compatibility Forms
    | '\u{ff3f}' // [＿] Halfwidth and Fullwidth Forms
    ;
// Token for Unicode general category Pd (Dash_Punctuation).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) and a Unicode block name.
CLASSIFY_Pd: // Dash_Punctuation
    '\u{002d}' // [-] Basic Latin
    | '\u{058a}' // [֊] Armenian
    | '\u{05be}' // [־] Hebrew
    | '\u{1400}' // [᐀] Unified Canadian Aboriginal Syllabics
    | '\u{1806}' // [᠆] Mongolian
    | '\u{2010}'..'\u{2015}' // [‐..―] General Punctuation
    | '\u{2e17}' // [⸗] Supplemental Punctuation
    | '\u{2e1a}' // [⸚] Supplemental Punctuation
    | '\u{2e3a}'..'\u{2e3b}' // [⸺..⸻] Supplemental Punctuation
    | '\u{2e40}' // [⹀] Supplemental Punctuation
    | '\u{301c}' // [〜] CJK Symbols and Punctuation
    | '\u{3030}' // [〰] CJK Symbols and Punctuation
    | '\u{30a0}' // [゠] Katakana
    | '\u{fe31}'..'\u{fe32}' // [︱..︲] CJK Compatibility Forms
    | '\u{fe58}' // [﹘] Small Form Variants
    | '\u{fe63}' // [﹣] Small Form Variants
    | '\u{ff0d}' // [－] Halfwidth and Fullwidth Forms
    ;
// Token for Unicode general category Pe (Close_Punctuation).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) (or U+XXXX where the glyph does not survive
// text normalisation) and a Unicode block name.
CLASSIFY_Pe: // Close_Punctuation
    '\u{0029}' // [)] Basic Latin
    | '\u{005d}' // []] Basic Latin
    | '\u{007d}' // [}] Basic Latin
    | '\u{0f3b}' // [༻] Tibetan
    | '\u{0f3d}' // [༽] Tibetan
    | '\u{169c}' // [᚜] Ogham
    | '\u{2046}' // [⁆] General Punctuation
    | '\u{207e}' // [⁾] Superscripts and Subscripts
    | '\u{208e}' // [₎] Superscripts and Subscripts
    | '\u{2309}' // [⌉] Miscellaneous Technical
    | '\u{230b}' // [⌋] Miscellaneous Technical
    | '\u{232a}' // [U+232A] Miscellaneous Technical
    | '\u{2769}' // [❩] Dingbats
    | '\u{276b}' // [❫] Dingbats
    | '\u{276d}' // [❭] Dingbats
    | '\u{276f}' // [❯] Dingbats
    | '\u{2771}' // [❱] Dingbats
    | '\u{2773}' // [❳] Dingbats
    | '\u{2775}' // [❵] Dingbats
    | '\u{27c6}' // [⟆] Miscellaneous Mathematical Symbols-A
    | '\u{27e7}' // [⟧] Miscellaneous Mathematical Symbols-A
    | '\u{27e9}' // [⟩] Miscellaneous Mathematical Symbols-A
    | '\u{27eb}' // [⟫] Miscellaneous Mathematical Symbols-A
    | '\u{27ed}' // [⟭] Miscellaneous Mathematical Symbols-A
    | '\u{27ef}' // [⟯] Miscellaneous Mathematical Symbols-A
    | '\u{2984}' // [⦄] Miscellaneous Mathematical Symbols-B
    | '\u{2986}' // [⦆] Miscellaneous Mathematical Symbols-B
    | '\u{2988}' // [⦈] Miscellaneous Mathematical Symbols-B
    | '\u{298a}' // [⦊] Miscellaneous Mathematical Symbols-B
    | '\u{298c}' // [⦌] Miscellaneous Mathematical Symbols-B
    | '\u{298e}' // [⦎] Miscellaneous Mathematical Symbols-B
    | '\u{2990}' // [⦐] Miscellaneous Mathematical Symbols-B
    | '\u{2992}' // [⦒] Miscellaneous Mathematical Symbols-B
    | '\u{2994}' // [⦔] Miscellaneous Mathematical Symbols-B
    | '\u{2996}' // [⦖] Miscellaneous Mathematical Symbols-B
    | '\u{2998}' // [⦘] Miscellaneous Mathematical Symbols-B
    | '\u{29d9}' // [⧙] Miscellaneous Mathematical Symbols-B
    | '\u{29db}' // [⧛] Miscellaneous Mathematical Symbols-B
    | '\u{29fd}' // [⧽] Miscellaneous Mathematical Symbols-B
    | '\u{2e23}' // [⸣] Supplemental Punctuation
    | '\u{2e25}' // [⸥] Supplemental Punctuation
    | '\u{2e27}' // [⸧] Supplemental Punctuation
    | '\u{2e29}' // [⸩] Supplemental Punctuation
    | '\u{3009}' // [〉] CJK Symbols and Punctuation
    | '\u{300b}' // [》] CJK Symbols and Punctuation
    | '\u{300d}' // [」] CJK Symbols and Punctuation
    | '\u{300f}' // [』] CJK Symbols and Punctuation
    | '\u{3011}' // [】] CJK Symbols and Punctuation
    | '\u{3015}' // [〕] CJK Symbols and Punctuation
    | '\u{3017}' // [〗] CJK Symbols and Punctuation
    | '\u{3019}' // [〙] CJK Symbols and Punctuation
    | '\u{301b}' // [〛] CJK Symbols and Punctuation
    | '\u{301e}'..'\u{301f}' // [〞..〟] CJK Symbols and Punctuation
    | '\u{fd3e}' // [﴾] Arabic Presentation Forms-A
    | '\u{fe18}' // [︘] Vertical Forms
    | '\u{fe36}' // [︶] CJK Compatibility Forms
    | '\u{fe38}' // [︸] CJK Compatibility Forms
    | '\u{fe3a}' // [︺] CJK Compatibility Forms
    | '\u{fe3c}' // [︼] CJK Compatibility Forms
    | '\u{fe3e}' // [︾] CJK Compatibility Forms
    | '\u{fe40}' // [﹀] CJK Compatibility Forms
    | '\u{fe42}' // [﹂] CJK Compatibility Forms
    | '\u{fe44}' // [﹄] CJK Compatibility Forms
    | '\u{fe48}' // [﹈] CJK Compatibility Forms
    | '\u{fe5a}' // [﹚] Small Form Variants
    | '\u{fe5c}' // [﹜] Small Form Variants
    | '\u{fe5e}' // [﹞] Small Form Variants
    | '\u{ff09}' // [）] Halfwidth and Fullwidth Forms
    | '\u{ff3d}' // [］] Halfwidth and Fullwidth Forms
    | '\u{ff5d}' // [｝] Halfwidth and Fullwidth Forms
    | '\u{ff60}' // [｠] Halfwidth and Fullwidth Forms
    | '\u{ff63}' // [｣] Halfwidth and Fullwidth Forms
    ;
// Token for Unicode general category Pf (Final_Punctuation).
// Each alternative is a single code point; the trailing comment shows the
// glyph and a Unicode block name.
CLASSIFY_Pf: // Final_Punctuation
    '\u{00bb}' // [»] Latin-1 Supplement
    | '\u{2019}' // [’] General Punctuation
    | '\u{201d}' // [”] General Punctuation
    | '\u{203a}' // [›] General Punctuation
    | '\u{2e03}' // [⸃] Supplemental Punctuation
    | '\u{2e05}' // [⸅] Supplemental Punctuation
    | '\u{2e0a}' // [⸊] Supplemental Punctuation
    | '\u{2e0d}' // [⸍] Supplemental Punctuation
    | '\u{2e1d}' // [⸝] Supplemental Punctuation
    | '\u{2e21}' // [⸡] Supplemental Punctuation
    ;
// Token for Unicode general category Pi (Initial_Punctuation).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) and a Unicode block name.
CLASSIFY_Pi: // Initial_Punctuation
    '\u{00ab}' // [«] Latin-1 Supplement
    | '\u{2018}' // [‘] General Punctuation
    | '\u{201b}'..'\u{201c}' // [‛..“] General Punctuation
    | '\u{201f}' // [‟] General Punctuation
    | '\u{2039}' // [‹] General Punctuation
    | '\u{2e02}' // [⸂] Supplemental Punctuation
    | '\u{2e04}' // [⸄] Supplemental Punctuation
    | '\u{2e09}' // [⸉] Supplemental Punctuation
    | '\u{2e0c}' // [⸌] Supplemental Punctuation
    | '\u{2e1c}' // [⸜] Supplemental Punctuation
    | '\u{2e20}' // [⸠] Supplemental Punctuation
    ;
// Token for Unicode general category Po (Other_Punctuation).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) (or U+XXXX where the glyph does not survive
// text normalisation) and a Unicode block name.
CLASSIFY_Po: // Other_Punctuation
    '\u{0021}'..'\u{0023}' // [!..#] Basic Latin
    | '\u{0025}'..'\u{0027}' // [%..'] Basic Latin
    | '\u{002a}' // [*] Basic Latin
    | '\u{002c}' // [,] Basic Latin
    | '\u{002e}'..'\u{002f}' // [.../] Basic Latin
    | '\u{003a}'..'\u{003b}' // [:..;] Basic Latin
    | '\u{003f}'..'\u{0040}' // [?..@] Basic Latin
    | '\u{005c}' // [\] Basic Latin
    | '\u{00a1}' // [¡] Latin-1 Supplement
    | '\u{00a7}' // [§] Latin-1 Supplement
    | '\u{00b6}'..'\u{00b7}' // [¶..·] Latin-1 Supplement
    | '\u{00bf}' // [¿] Latin-1 Supplement
    | '\u{037e}' // [U+037E] Greek and Coptic
    | '\u{0387}' // [U+0387] Greek and Coptic
    | '\u{055a}'..'\u{055f}' // [՚..՟] Armenian
    | '\u{0589}' // [։] Armenian
    | '\u{05c0}' // [׀] Hebrew
    | '\u{05c3}' // [׃] Hebrew
    | '\u{05c6}' // [׆] Hebrew
    | '\u{05f3}'..'\u{05f4}' // [׳..״] Hebrew
    | '\u{0609}'..'\u{060a}' // [؉..؊] Arabic
    | '\u{060c}'..'\u{060d}' // [،..؍] Arabic
    | '\u{061b}' // [؛] Arabic
    | '\u{061e}'..'\u{061f}' // [؞..؟] Arabic
    | '\u{066a}'..'\u{066d}' // [٪..٭] Arabic
    | '\u{06d4}' // [۔] Arabic
    | '\u{0700}'..'\u{070d}' // [܀..܍] Syriac
    | '\u{07f7}'..'\u{07f9}' // [߷..߹] NKo
    | '\u{0830}'..'\u{083e}' // [࠰..࠾] Samaritan
    | '\u{085e}' // [࡞] Mandaic
    | '\u{0964}'..'\u{0965}' // [।..॥] Devanagari
    | '\u{0970}' // [॰] Devanagari
    | '\u{0af0}' // [૰] Gujarati
    | '\u{0df4}' // [෴] Sinhala
    | '\u{0e4f}' // [๏] Thai
    | '\u{0e5a}'..'\u{0e5b}' // [๚..๛] Thai
    | '\u{0f04}'..'\u{0f12}' // [༄..༒] Tibetan
    | '\u{0f14}' // [༔] Tibetan
    | '\u{0f85}' // [྅] Tibetan
    | '\u{0fd0}'..'\u{0fd4}' // [࿐..࿔] Tibetan
    | '\u{0fd9}'..'\u{0fda}' // [࿙..࿚] Tibetan
    | '\u{104a}'..'\u{104f}' // [၊..၏] Myanmar
    | '\u{10fb}' // [჻] Georgian
    | '\u{1360}'..'\u{1368}' // [፠..፨] Ethiopic
    | '\u{166d}'..'\u{166e}' // [᙭..᙮] Unified Canadian Aboriginal Syllabics
    | '\u{16eb}'..'\u{16ed}' // [᛫..᛭] Runic
    | '\u{1735}'..'\u{1736}' // [᜵..᜶] Hanunoo
    | '\u{17d4}'..'\u{17d6}' // [។..៖] Khmer
    | '\u{17d8}'..'\u{17da}' // [៘..៚] Khmer
    | '\u{1800}'..'\u{1805}' // [᠀..᠅] Mongolian
    | '\u{1807}'..'\u{180a}' // [᠇..᠊] Mongolian
    | '\u{1944}'..'\u{1945}' // [᥄..᥅] Limbu
    | '\u{1a1e}'..'\u{1a1f}' // [᨞..᨟] Buginese
    | '\u{1aa0}'..'\u{1aa6}' // [᪠..᪦] Tai Tham
    | '\u{1aa8}'..'\u{1aad}' // [᪨..᪭] Tai Tham
    | '\u{1b5a}'..'\u{1b60}' // [᭚..᭠] Balinese
    | '\u{1bfc}'..'\u{1bff}' // [᯼..᯿] Batak
    | '\u{1c3b}'..'\u{1c3f}' // [᰻..᰿] Lepcha
    | '\u{1c7e}'..'\u{1c7f}' // [᱾..᱿] Ol Chiki
    | '\u{1cc0}'..'\u{1cc7}' // [᳀..᳇] Sundanese Supplement
    | '\u{1cd3}' // [᳓] Vedic Extensions
    | '\u{2016}'..'\u{2017}' // [‖..‗] General Punctuation
    | '\u{2020}'..'\u{2027}' // [†..‧] General Punctuation
    | '\u{2030}'..'\u{2038}' // [‰..‸] General Punctuation
    | '\u{203b}'..'\u{203e}' // [※..‾] General Punctuation
    | '\u{2041}'..'\u{2043}' // [⁁..⁃] General Punctuation
    | '\u{2047}'..'\u{2051}' // [⁇..⁑] General Punctuation
    | '\u{2053}' // [⁓] General Punctuation
    | '\u{2055}'..'\u{205e}' // [⁕..⁞] General Punctuation
    | '\u{2cf9}'..'\u{2cfc}' // [⳹..⳼] Coptic
    | '\u{2cfe}'..'\u{2cff}' // [⳾..⳿] Coptic
    | '\u{2d70}' // [⵰] Tifinagh
    | '\u{2e00}'..'\u{2e01}' // [⸀..⸁] Supplemental Punctuation
    | '\u{2e06}'..'\u{2e08}' // [⸆..⸈] Supplemental Punctuation
    | '\u{2e0b}' // [⸋] Supplemental Punctuation
    | '\u{2e0e}'..'\u{2e16}' // [⸎..⸖] Supplemental Punctuation
    | '\u{2e18}'..'\u{2e19}' // [⸘..⸙] Supplemental Punctuation
    | '\u{2e1b}' // [⸛] Supplemental Punctuation
    | '\u{2e1e}'..'\u{2e1f}' // [⸞..⸟] Supplemental Punctuation
    | '\u{2e2a}'..'\u{2e2e}' // [⸪..⸮] Supplemental Punctuation
    | '\u{2e30}'..'\u{2e39}' // [⸰..⸹] Supplemental Punctuation
    | '\u{2e3c}'..'\u{2e3f}' // [⸼..⸿] Supplemental Punctuation
    | '\u{2e41}' // [⹁] Supplemental Punctuation
    | '\u{2e43}'..'\u{2e44}' // [⹃..⹄] Supplemental Punctuation
    | '\u{3001}'..'\u{3003}' // [、..〃] CJK Symbols and Punctuation
    | '\u{303d}' // [〽] CJK Symbols and Punctuation
    | '\u{30fb}' // [・] Katakana
    | '\u{a4fe}'..'\u{a4ff}' // [꓾..꓿] Lisu
    | '\u{a60d}'..'\u{a60f}' // [꘍..꘏] Vai
    | '\u{a673}' // [꙳] Cyrillic Extended-B
    | '\u{a67e}' // [꙾] Cyrillic Extended-B
    | '\u{a6f2}'..'\u{a6f7}' // [꛲..꛷] Bamum
    | '\u{a874}'..'\u{a877}' // [꡴..꡷] Phags-pa
    | '\u{a8ce}'..'\u{a8cf}' // [꣎..꣏] Saurashtra
    | '\u{a8f8}'..'\u{a8fa}' // [꣸..꣺] Devanagari Extended
    | '\u{a8fc}' // [꣼] Devanagari Extended
    | '\u{a92e}'..'\u{a92f}' // [꤮..꤯] Kayah Li
    | '\u{a95f}' // [꥟] Rejang
    | '\u{a9c1}'..'\u{a9cd}' // [꧁..꧍] Javanese
    | '\u{a9de}'..'\u{a9df}' // [꧞..꧟] Javanese
    | '\u{aa5c}'..'\u{aa5f}' // [꩜..꩟] Cham
    | '\u{aade}'..'\u{aadf}' // [꫞..꫟] Tai Viet
    | '\u{aaf0}'..'\u{aaf1}' // [꫰..꫱] Meetei Mayek Extensions
    | '\u{abeb}' // [꯫] Meetei Mayek
    | '\u{fe10}'..'\u{fe16}' // [︐..︖] Vertical Forms
    | '\u{fe19}' // [︙] Vertical Forms
    | '\u{fe30}' // [︰] CJK Compatibility Forms
    | '\u{fe45}'..'\u{fe46}' // [﹅..﹆] CJK Compatibility Forms
    | '\u{fe49}'..'\u{fe4c}' // [﹉..﹌] CJK Compatibility Forms
    | '\u{fe50}'..'\u{fe57}' // [﹐..﹗] Small Form Variants
    | '\u{fe5f}'..'\u{fe61}' // [﹟..﹡] Small Form Variants
    | '\u{fe68}' // [﹨] Small Form Variants
    | '\u{fe6a}'..'\u{fe6b}' // [﹪..﹫] Small Form Variants
    | '\u{ff01}'..'\u{ff03}' // [！..＃] Halfwidth and Fullwidth Forms
    | '\u{ff05}'..'\u{ff07}' // [％..＇] Halfwidth and Fullwidth Forms
    | '\u{ff0a}' // [＊] Halfwidth and Fullwidth Forms
    | '\u{ff0c}' // [，] Halfwidth and Fullwidth Forms
    | '\u{ff0e}'..'\u{ff0f}' // [．..／] Halfwidth and Fullwidth Forms
    | '\u{ff1a}'..'\u{ff1b}' // [：..；] Halfwidth and Fullwidth Forms
    | '\u{ff1f}'..'\u{ff20}' // [？..＠] Halfwidth and Fullwidth Forms
    | '\u{ff3c}' // [＼] Halfwidth and Fullwidth Forms
    | '\u{ff61}' // [｡] Halfwidth and Fullwidth Forms
    | '\u{ff64}'..'\u{ff65}' // [､..･] Halfwidth and Fullwidth Forms
    | '\u{10100}'..'\u{10102}' // [𐄀..𐄂] Aegean Numbers
    | '\u{1039f}' // [𐎟] Ugaritic
    | '\u{103d0}' // [𐏐] Old Persian
    | '\u{1056f}' // [𐕯] Caucasian Albanian
    | '\u{10857}' // [𐡗] Imperial Aramaic
    | '\u{1091f}' // [𐤟] Phoenician
    | '\u{1093f}' // [𐤿] Lydian
    | '\u{10a50}'..'\u{10a58}' // [𐩐..𐩘] Kharoshthi
    | '\u{10a7f}' // [𐩿] Old South Arabian
    | '\u{10af0}'..'\u{10af6}' // [𐫰..𐫶] Manichaean
    | '\u{10b39}'..'\u{10b3f}' // [𐬹..𐬿] Avestan
    | '\u{10b99}'..'\u{10b9c}' // [𐮙..𐮜] Psalter Pahlavi
    | '\u{11047}'..'\u{1104d}' // [𑁇..𑁍] Brahmi
    | '\u{110bb}'..'\u{110bc}' // [𑂻..𑂼] Kaithi
    | '\u{110be}'..'\u{110c1}' // [𑂾..𑃁] Kaithi
    | '\u{11140}'..'\u{11143}' // [𑅀..𑅃] Chakma
    | '\u{11174}'..'\u{11175}' // [𑅴..𑅵] Mahajani
    | '\u{111c5}'..'\u{111c9}' // [𑇅..𑇉] Sharada
    | '\u{111cd}' // [𑇍] Sharada
    | '\u{111db}' // [𑇛] Sharada
    | '\u{111dd}'..'\u{111df}' // [𑇝..𑇟] Sharada
    | '\u{11238}'..'\u{1123d}' // [𑈸..𑈽] Khojki
    | '\u{112a9}' // [𑊩] Multani
    | '\u{1144b}'..'\u{1144f}' // [𑑋..𑑏] Newa
    | '\u{1145b}'..'\u{1145d}' // [𑑛..𑑝] Newa
    | '\u{114c6}' // [𑓆] Tirhuta
    | '\u{115c1}'..'\u{115d7}' // [𑗁..𑗗] Siddham
    | '\u{11641}'..'\u{11643}' // [𑙁..𑙃] Modi
    | '\u{11660}'..'\u{1166c}' // [𑙠..𑙬] Mongolian Supplement
    | '\u{1173c}'..'\u{1173e}' // [𑜼..𑜾] Ahom
    | '\u{11c41}'..'\u{11c45}' // [𑱁..𑱅] Bhaiksuki
    | '\u{11c70}'..'\u{11c71}' // [𑱰..𑱱] Marchen
    | '\u{12470}'..'\u{12474}' // [𒑰..𒑴] Cuneiform Numbers and Punctuation
    | '\u{16a6e}'..'\u{16a6f}' // [𖩮..𖩯] Mro
    | '\u{16af5}' // [𖫵] Bassa Vah
    | '\u{16b37}'..'\u{16b3b}' // [𖬷..𖬻] Pahawh Hmong
    | '\u{16b44}' // [𖭄] Pahawh Hmong
    | '\u{1bc9f}' // [𛲟] Duployan
    | '\u{1da87}'..'\u{1da8b}' // [𝪇..𝪋] Sutton SignWriting
    | '\u{1e95e}'..'\u{1e95f}' // [𞥞..𞥟] Adlam
    ;
// Token for Unicode general category Ps (Open_Punctuation).
// Each alternative is a single code point; the trailing comment shows the
// glyph (or U+XXXX where the glyph does not survive text normalisation) and
// a Unicode block name.
CLASSIFY_Ps: // Open_Punctuation
    '\u{0028}' // [(] Basic Latin
    | '\u{005b}' // [[] Basic Latin
    | '\u{007b}' // [{] Basic Latin
    | '\u{0f3a}' // [༺] Tibetan
    | '\u{0f3c}' // [༼] Tibetan
    | '\u{169b}' // [᚛] Ogham
    | '\u{201a}' // [‚] General Punctuation
    | '\u{201e}' // [„] General Punctuation
    | '\u{2045}' // [⁅] General Punctuation
    | '\u{207d}' // [⁽] Superscripts and Subscripts
    | '\u{208d}' // [₍] Superscripts and Subscripts
    | '\u{2308}' // [⌈] Miscellaneous Technical
    | '\u{230a}' // [⌊] Miscellaneous Technical
    | '\u{2329}' // [U+2329] Miscellaneous Technical
    | '\u{2768}' // [❨] Dingbats
    | '\u{276a}' // [❪] Dingbats
    | '\u{276c}' // [❬] Dingbats
    | '\u{276e}' // [❮] Dingbats
    | '\u{2770}' // [❰] Dingbats
    | '\u{2772}' // [❲] Dingbats
    | '\u{2774}' // [❴] Dingbats
    | '\u{27c5}' // [⟅] Miscellaneous Mathematical Symbols-A
    | '\u{27e6}' // [⟦] Miscellaneous Mathematical Symbols-A
    | '\u{27e8}' // [⟨] Miscellaneous Mathematical Symbols-A
    | '\u{27ea}' // [⟪] Miscellaneous Mathematical Symbols-A
    | '\u{27ec}' // [⟬] Miscellaneous Mathematical Symbols-A
    | '\u{27ee}' // [⟮] Miscellaneous Mathematical Symbols-A
    | '\u{2983}' // [⦃] Miscellaneous Mathematical Symbols-B
    | '\u{2985}' // [⦅] Miscellaneous Mathematical Symbols-B
    | '\u{2987}' // [⦇] Miscellaneous Mathematical Symbols-B
    | '\u{2989}' // [⦉] Miscellaneous Mathematical Symbols-B
    | '\u{298b}' // [⦋] Miscellaneous Mathematical Symbols-B
    | '\u{298d}' // [⦍] Miscellaneous Mathematical Symbols-B
    | '\u{298f}' // [⦏] Miscellaneous Mathematical Symbols-B
    | '\u{2991}' // [⦑] Miscellaneous Mathematical Symbols-B
    | '\u{2993}' // [⦓] Miscellaneous Mathematical Symbols-B
    | '\u{2995}' // [⦕] Miscellaneous Mathematical Symbols-B
    | '\u{2997}' // [⦗] Miscellaneous Mathematical Symbols-B
    | '\u{29d8}' // [⧘] Miscellaneous Mathematical Symbols-B
    | '\u{29da}' // [⧚] Miscellaneous Mathematical Symbols-B
    | '\u{29fc}' // [⧼] Miscellaneous Mathematical Symbols-B
    | '\u{2e22}' // [⸢] Supplemental Punctuation
    | '\u{2e24}' // [⸤] Supplemental Punctuation
    | '\u{2e26}' // [⸦] Supplemental Punctuation
    | '\u{2e28}' // [⸨] Supplemental Punctuation
    | '\u{2e42}' // [⹂] Supplemental Punctuation
    | '\u{3008}' // [〈] CJK Symbols and Punctuation
    | '\u{300a}' // [《] CJK Symbols and Punctuation
    | '\u{300c}' // [「] CJK Symbols and Punctuation
    | '\u{300e}' // [『] CJK Symbols and Punctuation
    | '\u{3010}' // [【] CJK Symbols and Punctuation
    | '\u{3014}' // [〔] CJK Symbols and Punctuation
    | '\u{3016}' // [〖] CJK Symbols and Punctuation
    | '\u{3018}' // [〘] CJK Symbols and Punctuation
    | '\u{301a}' // [〚] CJK Symbols and Punctuation
    | '\u{301d}' // [〝] CJK Symbols and Punctuation
    | '\u{fd3f}' // [﴿] Arabic Presentation Forms-A
    | '\u{fe17}' // [︗] Vertical Forms
    | '\u{fe35}' // [︵] CJK Compatibility Forms
    | '\u{fe37}' // [︷] CJK Compatibility Forms
    | '\u{fe39}' // [︹] CJK Compatibility Forms
    | '\u{fe3b}' // [︻] CJK Compatibility Forms
    | '\u{fe3d}' // [︽] CJK Compatibility Forms
    | '\u{fe3f}' // [︿] CJK Compatibility Forms
    | '\u{fe41}' // [﹁] CJK Compatibility Forms
    | '\u{fe43}' // [﹃] CJK Compatibility Forms
    | '\u{fe47}' // [﹇] CJK Compatibility Forms
    | '\u{fe59}' // [﹙] Small Form Variants
    | '\u{fe5b}' // [﹛] Small Form Variants
    | '\u{fe5d}' // [﹝] Small Form Variants
    | '\u{ff08}' // [（] Halfwidth and Fullwidth Forms
    | '\u{ff3b}' // [［] Halfwidth and Fullwidth Forms
    | '\u{ff5b}' // [｛] Halfwidth and Fullwidth Forms
    | '\u{ff5f}' // [｟] Halfwidth and Fullwidth Forms
    | '\u{ff62}' // [｢] Halfwidth and Fullwidth Forms
    ;
// Token for Unicode general category Sc (Currency_Symbol).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) and a Unicode block name.
CLASSIFY_Sc: // Currency_Symbol
    '\u{0024}' // [$] Basic Latin
    | '\u{00a2}'..'\u{00a5}' // [¢..¥] Latin-1 Supplement
    | '\u{058f}' // [֏] Armenian
    | '\u{060b}' // [؋] Arabic
    | '\u{09f2}'..'\u{09f3}' // [৲..৳] Bengali
    | '\u{09fb}' // [৻] Bengali
    | '\u{0af1}' // [૱] Gujarati
    | '\u{0bf9}' // [௹] Tamil
    | '\u{0e3f}' // [฿] Thai
    | '\u{17db}' // [៛] Khmer
    | '\u{20a0}'..'\u{20be}' // [₠..₾] Currency Symbols
    | '\u{a838}' // [꠸] Common Indic Number Forms
    | '\u{fdfc}' // [﷼] Arabic Presentation Forms-A
    | '\u{fe69}' // [﹩] Small Form Variants
    | '\u{ff04}' // [＄] Halfwidth and Fullwidth Forms
    | '\u{ffe0}'..'\u{ffe1}' // [￠..￡] Halfwidth and Fullwidth Forms
    | '\u{ffe5}'..'\u{ffe6}' // [￥..￦] Halfwidth and Fullwidth Forms
    ;
// Token for Unicode general category Sk (Modifier_Symbol).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) (or U+XXXX where the glyph does not survive
// text normalisation) and a Unicode block name.
CLASSIFY_Sk: // Modifier_Symbol
    '\u{005e}' // [^] Basic Latin
    | '\u{0060}' // [`] Basic Latin
    | '\u{00a8}' // [¨] Latin-1 Supplement
    | '\u{00af}' // [¯] Latin-1 Supplement
    | '\u{00b4}' // [´] Latin-1 Supplement
    | '\u{00b8}' // [¸] Latin-1 Supplement
    | '\u{02c2}'..'\u{02c5}' // [˂..˅] Spacing Modifier Letters
    | '\u{02d2}'..'\u{02df}' // [˒..˟] Spacing Modifier Letters
    | '\u{02e5}'..'\u{02eb}' // [˥..˫] Spacing Modifier Letters
    | '\u{02ed}' // [˭] Spacing Modifier Letters
    | '\u{02ef}'..'\u{02ff}' // [˯..˿] Spacing Modifier Letters
    | '\u{0375}' // [͵] Greek and Coptic
    | '\u{0384}'..'\u{0385}' // [΄..΅] Greek and Coptic
    | '\u{1fbd}' // [᾽] Greek Extended
    | '\u{1fbf}'..'\u{1fc1}' // [᾿..῁] Greek Extended
    | '\u{1fcd}'..'\u{1fcf}' // [῍..῏] Greek Extended
    | '\u{1fdd}'..'\u{1fdf}' // [῝..῟] Greek Extended
    | '\u{1fed}'..'\u{1fef}' // [῭..U+1FEF] Greek Extended
    | '\u{1ffd}'..'\u{1ffe}' // [U+1FFD..῾] Greek Extended
    | '\u{309b}'..'\u{309c}' // [゛..゜] Hiragana
    | '\u{a700}'..'\u{a716}' // [꜀..꜖] Modifier Tone Letters
    | '\u{a720}'..'\u{a721}' // [꜠..꜡] Latin Extended-D
    | '\u{a789}'..'\u{a78a}' // [꞉..꞊] Latin Extended-D
    | '\u{ab5b}' // [꭛] Latin Extended-E
    | '\u{fbb2}'..'\u{fbc1}' // [﮲..﯁] Arabic Presentation Forms-A
    | '\u{ff3e}' // [＾] Halfwidth and Fullwidth Forms
    | '\u{ff40}' // [｀] Halfwidth and Fullwidth Forms
    | '\u{ffe3}' // [￣] Halfwidth and Fullwidth Forms
    | '\u{1f3fb}'..'\u{1f3ff}' // [🏻..🏿] Miscellaneous Symbols and Pictographs
    ;
// Token for Unicode general category Sm (Math_Symbol).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) and a Unicode block name (for a range that
// crosses blocks, apparently the block of its first code point).
CLASSIFY_Sm: // Math_Symbol
    '\u{002b}' // [+] Basic Latin
    | '\u{003c}'..'\u{003e}' // [<..>] Basic Latin
    | '\u{007c}' // [|] Basic Latin
    | '\u{007e}' // [~] Basic Latin
    | '\u{00ac}' // [¬] Latin-1 Supplement
    | '\u{00b1}' // [±] Latin-1 Supplement
    | '\u{00d7}' // [×] Latin-1 Supplement
    | '\u{00f7}' // [÷] Latin-1 Supplement
    | '\u{03f6}' // [϶] Greek and Coptic
    | '\u{0606}'..'\u{0608}' // [؆..؈] Arabic
    | '\u{2044}' // [⁄] General Punctuation
    | '\u{2052}' // [⁒] General Punctuation
    | '\u{207a}'..'\u{207c}' // [⁺..⁼] Superscripts and Subscripts
    | '\u{208a}'..'\u{208c}' // [₊..₌] Superscripts and Subscripts
    | '\u{2118}' // [℘] Letterlike Symbols
    | '\u{2140}'..'\u{2144}' // [⅀..⅄] Letterlike Symbols
    | '\u{214b}' // [⅋] Letterlike Symbols
    | '\u{2190}'..'\u{2194}' // [←..↔] Arrows
    | '\u{219a}'..'\u{219b}' // [↚..↛] Arrows
    | '\u{21a0}' // [↠] Arrows
    | '\u{21a3}' // [↣] Arrows
    | '\u{21a6}' // [↦] Arrows
    | '\u{21ae}' // [↮] Arrows
    | '\u{21ce}'..'\u{21cf}' // [⇎..⇏] Arrows
    | '\u{21d2}' // [⇒] Arrows
    | '\u{21d4}' // [⇔] Arrows
    | '\u{21f4}'..'\u{22ff}' // [⇴..⋿] Arrows
    | '\u{2320}'..'\u{2321}' // [⌠..⌡] Miscellaneous Technical
    | '\u{237c}' // [⍼] Miscellaneous Technical
    | '\u{239b}'..'\u{23b3}' // [⎛..⎳] Miscellaneous Technical
    | '\u{23dc}'..'\u{23e1}' // [⏜..⏡] Miscellaneous Technical
    | '\u{25b7}' // [▷] Geometric Shapes
    | '\u{25c1}' // [◁] Geometric Shapes
    | '\u{25f8}'..'\u{25ff}' // [◸..◿] Geometric Shapes
    | '\u{266f}' // [♯] Miscellaneous Symbols
    | '\u{27c0}'..'\u{27c4}' // [⟀..⟄] Miscellaneous Mathematical Symbols-A
    | '\u{27c7}'..'\u{27e5}' // [⟇..⟥] Miscellaneous Mathematical Symbols-A
    | '\u{27f0}'..'\u{27ff}' // [⟰..⟿] Supplemental Arrows-A
    | '\u{2900}'..'\u{2982}' // [⤀..⦂] Supplemental Arrows-B
    | '\u{2999}'..'\u{29d7}' // [⦙..⧗] Miscellaneous Mathematical Symbols-B
    | '\u{29dc}'..'\u{29fb}' // [⧜..⧻] Miscellaneous Mathematical Symbols-B
    | '\u{29fe}'..'\u{2aff}' // [⧾..⫿] Miscellaneous Mathematical Symbols-B
    | '\u{2b30}'..'\u{2b44}' // [⬰..⭄] Miscellaneous Symbols and Arrows
    | '\u{2b47}'..'\u{2b4c}' // [⭇..⭌] Miscellaneous Symbols and Arrows
    | '\u{fb29}' // [﬩] Alphabetic Presentation Forms
    | '\u{fe62}' // [﹢] Small Form Variants
    | '\u{fe64}'..'\u{fe66}' // [﹤..﹦] Small Form Variants
    | '\u{ff0b}' // [＋] Halfwidth and Fullwidth Forms
    | '\u{ff1c}'..'\u{ff1e}' // [＜..＞] Halfwidth and Fullwidth Forms
    | '\u{ff5c}' // [｜] Halfwidth and Fullwidth Forms
    | '\u{ff5e}' // [～] Halfwidth and Fullwidth Forms
    | '\u{ffe2}' // [￢] Halfwidth and Fullwidth Forms
    | '\u{ffe9}'..'\u{ffec}' // [￩..￬] Halfwidth and Fullwidth Forms
    | '\u{1d6c1}' // [𝛁] Mathematical Alphanumeric Symbols
    | '\u{1d6db}' // [𝛛] Mathematical Alphanumeric Symbols
    | '\u{1d6fb}' // [𝛻] Mathematical Alphanumeric Symbols
    | '\u{1d715}' // [𝜕] Mathematical Alphanumeric Symbols
    | '\u{1d735}' // [𝜵] Mathematical Alphanumeric Symbols
    | '\u{1d74f}' // [𝝏] Mathematical Alphanumeric Symbols
    | '\u{1d76f}' // [𝝯] Mathematical Alphanumeric Symbols
    | '\u{1d789}' // [𝞉] Mathematical Alphanumeric Symbols
    | '\u{1d7a9}' // [𝞩] Mathematical Alphanumeric Symbols
    | '\u{1d7c3}' // [𝟃] Mathematical Alphanumeric Symbols
    | '\u{1eef0}'..'\u{1eef1}' // [𞻰..𞻱] Arabic Mathematical Alphabetic Symbols
    ;
// Token for Unicode general category So (Other_Symbol).
// Each alternative is a single code point or an inclusive range; the trailing
// comment shows the glyph(s) (or U+XXXX where the glyph is invisible or does
// not survive text normalisation) and a Unicode block name (for a range that
// crosses blocks, apparently the block of its first code point).
// NOTE(review): several ranges (e.g. 2e80..2ffb, 23e2..244a, 1f400..1f9c0)
// appear to span code points that are unassigned in Unicode 9.0 - confirm
// whether the generator merges across such gaps on purpose.
CLASSIFY_So: // Other_Symbol
    '\u{00a6}' // [¦] Latin-1 Supplement
    | '\u{00a9}' // [©] Latin-1 Supplement
    | '\u{00ae}' // [®] Latin-1 Supplement
    | '\u{00b0}' // [°] Latin-1 Supplement
    | '\u{0482}' // [҂] Cyrillic
    | '\u{058d}'..'\u{058e}' // [֍..֎] Armenian
    | '\u{060e}'..'\u{060f}' // [؎..؏] Arabic
    | '\u{06de}' // [۞] Arabic
    | '\u{06e9}' // [۩] Arabic
    | '\u{06fd}'..'\u{06fe}' // [۽..۾] Arabic
    | '\u{07f6}' // [߶] NKo
    | '\u{09fa}' // [৺] Bengali
    | '\u{0b70}' // [୰] Oriya
    | '\u{0bf3}'..'\u{0bf8}' // [௳..௸] Tamil
    | '\u{0bfa}' // [௺] Tamil
    | '\u{0c7f}' // [౿] Telugu
    | '\u{0d4f}' // [൏] Malayalam
    | '\u{0d79}' // [൹] Malayalam
    | '\u{0f01}'..'\u{0f03}' // [༁..༃] Tibetan
    | '\u{0f13}' // [༓] Tibetan
    | '\u{0f15}'..'\u{0f17}' // [༕..༗] Tibetan
    | '\u{0f1a}'..'\u{0f1f}' // [༚..༟] Tibetan
    | '\u{0f34}' // [༴] Tibetan
    | '\u{0f36}' // [༶] Tibetan
    | '\u{0f38}' // [༸] Tibetan
    | '\u{0fbe}'..'\u{0fc5}' // [྾..࿅] Tibetan
    | '\u{0fc7}'..'\u{0fcf}' // [࿇..࿏] Tibetan
    | '\u{0fd5}'..'\u{0fd8}' // [࿕..࿘] Tibetan
    | '\u{109e}'..'\u{109f}' // [႞..႟] Myanmar
    | '\u{1390}'..'\u{1399}' // [᎐..᎙] Ethiopic Supplement
    | '\u{1940}' // [᥀] Limbu
    | '\u{19de}'..'\u{19ff}' // [᧞..᧿] New Tai Lue
    | '\u{1b61}'..'\u{1b6a}' // [᭡..᭪] Balinese
    | '\u{1b74}'..'\u{1b7c}' // [᭴..᭼] Balinese
    | '\u{2100}'..'\u{2101}' // [℀..℁] Letterlike Symbols
    | '\u{2103}'..'\u{2106}' // [℃..℆] Letterlike Symbols
    | '\u{2108}'..'\u{2109}' // [℈..℉] Letterlike Symbols
    | '\u{2114}' // [℔] Letterlike Symbols
    | '\u{2116}'..'\u{2117}' // [№..℗] Letterlike Symbols
    | '\u{211e}'..'\u{2123}' // [℞..℣] Letterlike Symbols
    | '\u{2125}' // [℥] Letterlike Symbols
    | '\u{2127}' // [℧] Letterlike Symbols
    | '\u{2129}' // [℩] Letterlike Symbols
    | '\u{212e}' // [℮] Letterlike Symbols
    | '\u{213a}'..'\u{213b}' // [℺..℻] Letterlike Symbols
    | '\u{214a}' // [⅊] Letterlike Symbols
    | '\u{214c}'..'\u{214d}' // [⅌..⅍] Letterlike Symbols
    | '\u{214f}' // [⅏] Letterlike Symbols
    | '\u{218a}'..'\u{218b}' // [↊..↋] Number Forms
    | '\u{2195}'..'\u{2199}' // [↕..↙] Arrows
    | '\u{219c}'..'\u{219f}' // [↜..↟] Arrows
    | '\u{21a1}'..'\u{21a2}' // [↡..↢] Arrows
    | '\u{21a4}'..'\u{21a5}' // [↤..↥] Arrows
    | '\u{21a7}'..'\u{21ad}' // [↧..↭] Arrows
    | '\u{21af}'..'\u{21cd}' // [↯..⇍] Arrows
    | '\u{21d0}'..'\u{21d1}' // [⇐..⇑] Arrows
    | '\u{21d3}' // [⇓] Arrows
    | '\u{21d5}'..'\u{21f3}' // [⇕..⇳] Arrows
    | '\u{2300}'..'\u{2307}' // [⌀..⌇] Miscellaneous Technical
    | '\u{230c}'..'\u{231f}' // [⌌..⌟] Miscellaneous Technical
    | '\u{2322}'..'\u{2328}' // [⌢..⌨] Miscellaneous Technical
    | '\u{232b}'..'\u{237b}' // [⌫..⍻] Miscellaneous Technical
    | '\u{237d}'..'\u{239a}' // [⍽..⎚] Miscellaneous Technical
    | '\u{23b4}'..'\u{23db}' // [⎴..⏛] Miscellaneous Technical
    | '\u{23e2}'..'\u{244a}' // [⏢..⑊] Miscellaneous Technical
    | '\u{249c}'..'\u{24e9}' // [⒜..ⓩ] Enclosed Alphanumerics
    | '\u{2500}'..'\u{25b6}' // [─..▶] Box Drawing
    | '\u{25b8}'..'\u{25c0}' // [▸..◀] Geometric Shapes
    | '\u{25c2}'..'\u{25f7}' // [◂..◷] Geometric Shapes
    | '\u{2600}'..'\u{266e}' // [☀..♮] Miscellaneous Symbols
    | '\u{2670}'..'\u{2767}' // [♰..❧] Miscellaneous Symbols
    | '\u{2794}'..'\u{27bf}' // [➔..➿] Dingbats
    | '\u{2800}'..'\u{28ff}' // [⠀..⣿] Braille Patterns
    | '\u{2b00}'..'\u{2b2f}' // [⬀..⬯] Miscellaneous Symbols and Arrows
    | '\u{2b45}'..'\u{2b46}' // [⭅..⭆] Miscellaneous Symbols and Arrows
    | '\u{2b4d}'..'\u{2bef}' // [⭍..⯯] Miscellaneous Symbols and Arrows
    | '\u{2ce5}'..'\u{2cea}' // [⳥..⳪] Coptic
    | '\u{2e80}'..'\u{2ffb}' // [⺀..⿻] CJK Radicals Supplement
    | '\u{3004}' // [〄] CJK Symbols and Punctuation
    | '\u{3012}'..'\u{3013}' // [〒..〓] CJK Symbols and Punctuation
    | '\u{3020}' // [〠] CJK Symbols and Punctuation
    | '\u{3036}'..'\u{3037}' // [〶..〷] CJK Symbols and Punctuation
    | '\u{303e}'..'\u{303f}' // [〾..〿] CJK Symbols and Punctuation
    | '\u{3190}'..'\u{3191}' // [㆐..㆑] Kanbun
    | '\u{3196}'..'\u{319f}' // [㆖..㆟] Kanbun
    | '\u{31c0}'..'\u{31e3}' // [㇀..㇣] CJK Strokes
    | '\u{3200}'..'\u{321e}' // [㈀..㈞] Enclosed CJK Letters and Months
    | '\u{322a}'..'\u{3247}' // [㈪..㉇] Enclosed CJK Letters and Months
    | '\u{3250}' // [㉐] Enclosed CJK Letters and Months
    | '\u{3260}'..'\u{327f}' // [㉠..㉿] Enclosed CJK Letters and Months
    | '\u{328a}'..'\u{32b0}' // [㊊..㊰] Enclosed CJK Letters and Months
    | '\u{32c0}'..'\u{33ff}' // [㋀..㏿] Enclosed CJK Letters and Months
    | '\u{4dc0}'..'\u{4dff}' // [䷀..䷿] Yijing Hexagram Symbols
    | '\u{a490}'..'\u{a4c6}' // [꒐..꓆] Yi Radicals
    | '\u{a828}'..'\u{a82b}' // [꠨..꠫] Syloti Nagri
    | '\u{a836}'..'\u{a837}' // [꠶..꠷] Common Indic Number Forms
    | '\u{a839}' // [꠹] Common Indic Number Forms
    | '\u{aa77}'..'\u{aa79}' // [꩷..꩹] Myanmar Extended-A
    | '\u{fdfd}' // [﷽] Arabic Presentation Forms-A
    | '\u{ffe4}' // [￤] Halfwidth and Fullwidth Forms
    | '\u{ffe8}' // [￨] Halfwidth and Fullwidth Forms
    | '\u{ffed}'..'\u{ffee}' // [￭..￮] Halfwidth and Fullwidth Forms
    | '\u{fffc}'..'\u{fffd}' // [U+FFFC..U+FFFD] Specials
    | '\u{10137}'..'\u{1013f}' // [𐄷..𐄿] Aegean Numbers
    | '\u{10179}'..'\u{10189}' // [𐅹..𐆉] Ancient Greek Numbers
    | '\u{1018c}'..'\u{101fc}' // [𐆌..𐇼] Ancient Greek Numbers
    | '\u{10877}'..'\u{10878}' // [𐡷..𐡸] Palmyrene
    | '\u{10ac8}' // [𐫈] Manichaean
    | '\u{1173f}' // [𑜿] Ahom
    | '\u{16b3c}'..'\u{16b3f}' // [𖬼..𖬿] Pahawh Hmong
    | '\u{16b45}' // [𖭅] Pahawh Hmong
    | '\u{1bc9c}' // [𛲜] Duployan
    | '\u{1d000}'..'\u{1d164}' // [𝀀..U+1D164] Byzantine Musical Symbols
    | '\u{1d16a}'..'\u{1d16c}' // [𝅪..𝅬] Musical Symbols
    | '\u{1d183}'..'\u{1d184}' // [𝆃..𝆄] Musical Symbols
    | '\u{1d18c}'..'\u{1d1a9}' // [𝆌..𝆩] Musical Symbols
    | '\u{1d1ae}'..'\u{1d241}' // [𝆮..𝉁] Musical Symbols
    | '\u{1d245}'..'\u{1d356}' // [𝉅..𝍖] Ancient Greek Musical Notation
    | '\u{1d800}'..'\u{1d9ff}' // [𝠀..𝧿] Sutton SignWriting
    | '\u{1da37}'..'\u{1da3a}' // [𝨷..𝨺] Sutton SignWriting
    | '\u{1da6d}'..'\u{1da74}' // [𝩭..𝩴] Sutton SignWriting
    | '\u{1da76}'..'\u{1da83}' // [𝩶..𝪃] Sutton SignWriting
    | '\u{1da85}'..'\u{1da86}' // [𝪅..𝪆] Sutton SignWriting
    | '\u{1f000}'..'\u{1f0f5}' // [🀀..🃵] Mahjong Tiles
    | '\u{1f110}'..'\u{1f3fa}' // [🄐..🏺] Enclosed Alphanumeric Supplement
    | '\u{1f400}'..'\u{1f9c0}' // [🐀..🧀] Miscellaneous Symbols and Pictographs
    ;
// Token for Unicode general category Zl (Line_Separator): the single code
// point U+2028. The character is named rather than embedded in the comment
// because many editors render a raw U+2028 as a line break.
CLASSIFY_Zl: // Line_Separator
    '\u{2028}' // [U+2028 LINE SEPARATOR] General Punctuation
    ;
// Token for Unicode general category Zp (Paragraph_Separator): the single
// code point U+2029. The character is named rather than embedded in the
// comment because many editors render a raw U+2029 as a line break.
CLASSIFY_Zp: // Paragraph_Separator
    '\u{2029}' // [U+2029 PARAGRAPH SEPARATOR] General Punctuation
    ;
// Token for Unicode general category Zs (Space_Separator).
// The characters are invisible, so each comment gives the code point and
// character name instead of a raw glyph, followed by a Unicode block name.
CLASSIFY_Zs: // Space_Separator
    '\u{0020}' // [U+0020 SPACE] Basic Latin
    | '\u{00a0}' // [U+00A0 NO-BREAK SPACE] Latin-1 Supplement
    | '\u{1680}' // [U+1680 OGHAM SPACE MARK] Ogham
    | '\u{2000}'..'\u{200a}' // [U+2000 EN QUAD..U+200A HAIR SPACE] General Punctuation
    | '\u{202f}' // [U+202F NARROW NO-BREAK SPACE] General Punctuation
    | '\u{205f}' // [U+205F MEDIUM MATHEMATICAL SPACE] General Punctuation
    | '\u{3000}' // [U+3000 IDEOGRAPHIC SPACE] CJK Symbols and Punctuation
    ;
// Grouped category C: matches anything matched by Cc, Cf, Co or Cs.
// No Cn (Unassigned) alternative is listed here.
// NOTE(review): the alternatives are themselves token rules; if they are
// defined earlier in the file, ANTLR's first-rule-wins tie-break means the
// lexer reports the specific CLASSIFY_Cx type rather than CLASSIFY_C - confirm
// this rule is intended as a token and not a fragment.
CLASSIFY_C :
    CLASSIFY_Cc
    | CLASSIFY_Cf
    | CLASSIFY_Co
    | CLASSIFY_Cs // from local/PropertyValueAliases.txt
    ;
// Grouped category LC (cased letters): matches anything matched by Ll, Lt or Lu.
// NOTE(review): the alternatives are themselves token rules; if they are
// defined earlier in the file, ANTLR's first-rule-wins tie-break means the
// lexer reports the specific type rather than CLASSIFY_LC - confirm intent.
CLASSIFY_LC :
    CLASSIFY_Ll
    | CLASSIFY_Lt
    | CLASSIFY_Lu // from local/PropertyValueAliases.txt
    ;
// Grouped category M (marks): matches anything matched by Mc, Me or Mn.
// NOTE(review): the alternatives are themselves token rules; if they are
// defined earlier in the file, ANTLR's first-rule-wins tie-break means the
// lexer reports the specific type rather than CLASSIFY_M - confirm intent.
CLASSIFY_M :
    CLASSIFY_Mc
    | CLASSIFY_Me
    | CLASSIFY_Mn // from local/PropertyValueAliases.txt
    ;
// Grouped category L (letters): matches anything matched by Ll, Lm, Lo, Lt or Lu.
// Referenced by the hand-written CLASSIFY_ID0 rule.
// NOTE(review): the alternatives are themselves token rules; if they are
// defined earlier in the file, ANTLR's first-rule-wins tie-break means the
// lexer reports the specific type rather than CLASSIFY_L - confirm intent.
CLASSIFY_L :
    CLASSIFY_Ll
    | CLASSIFY_Lm
    | CLASSIFY_Lo
    | CLASSIFY_Lt
    | CLASSIFY_Lu // from local/PropertyValueAliases.txt
    ;
// Grouped category N (numbers): matches anything matched by Nd, Nl or No.
// Referenced by the hand-written CLASSIFY_ID1 rule.
// NOTE(review): the alternatives are themselves token rules; if they are
// defined earlier in the file, ANTLR's first-rule-wins tie-break means the
// lexer reports the specific type rather than CLASSIFY_N - confirm intent.
CLASSIFY_N :
    CLASSIFY_Nd
    | CLASSIFY_Nl
    | CLASSIFY_No // from local/PropertyValueAliases.txt
    ;
// Grouped category P (punctuation): matches anything matched by
// Pc, Pd, Pe, Pf, Pi, Po or Ps.
// NOTE(review): every alternative is a token rule defined earlier in this
// file, so under ANTLR's first-rule-wins tie-break a single punctuation
// character is reported as the specific CLASSIFY_Px type, not CLASSIFY_P -
// confirm this rule is intended as a token and not a fragment.
CLASSIFY_P :
    CLASSIFY_Pc
    | CLASSIFY_Pd
    | CLASSIFY_Pe
    | CLASSIFY_Pf
    | CLASSIFY_Pi
    | CLASSIFY_Po
    | CLASSIFY_Ps // from local/PropertyValueAliases.txt
    ;
// Grouped category S (symbols): matches anything matched by Sc, Sk, Sm or So.
// NOTE(review): every alternative is a token rule defined earlier in this
// file, so under ANTLR's first-rule-wins tie-break a single symbol character
// is reported as the specific CLASSIFY_Sx type, not CLASSIFY_S - confirm
// this rule is intended as a token and not a fragment.
CLASSIFY_S :
    CLASSIFY_Sc
    | CLASSIFY_Sk
    | CLASSIFY_Sm
    | CLASSIFY_So // from local/PropertyValueAliases.txt
    ;
// Grouped category Z (separators): matches anything matched by Zl, Zp or Zs.
// Referenced by the hand-written CLASSIFY_WS rule.
// NOTE(review): every alternative is a token rule defined earlier in this
// file, so under ANTLR's first-rule-wins tie-break a single separator is
// reported as the specific CLASSIFY_Zx type, not CLASSIFY_Z - confirm intent.
CLASSIFY_Z :
    CLASSIFY_Zl
    | CLASSIFY_Zp
    | CLASSIFY_Zs // from local/PropertyValueAliases.txt
    ;
/* End of generated Unicode codepoint classification; the rules below are hand-written. */
// Whitespace run: one or more characters matched by CLASSIFY_Z
// (Zl, Zp and Zs). No `-> skip` or channel action is attached, so these
// tokens are delivered to the parser.
// NOTE(review): a run of exactly one separator ties in length with the
// earlier single-character separator rules, which win the tie; this token is
// therefore only produced for runs of two or more - confirm that is intended.
CLASSIFY_WS : CLASSIFY_Z+ // hand-written rule
    ;
// Identifier start character: any letter matched by CLASSIFY_L, or '_'.
// ('_' is U+005F, which CLASSIFY_Pc also matches.)
// NOTE(review): this is declared as a token, not a `fragment`; since it only
// ever matches one character that earlier rules also match, it looks like it
// can never be emitted on its own - consider `fragment` if no parser rule
// references it.
CLASSIFY_ID0 : CLASSIFY_L | '_' // hand-written rule
    ;
// Identifier continuation character: anything CLASSIFY_ID0 accepts, or any
// number matched by CLASSIFY_N (Nd, Nl, No).
// NOTE(review): declared as a token, not a `fragment`; it only ever matches
// one character that earlier rules also match - consider `fragment` if no
// parser rule references it.
CLASSIFY_ID1 : CLASSIFY_ID0 | CLASSIFY_N // hand-written rule
    ;
// Identifier: one start character (CLASSIFY_ID0) followed by zero or more
// continuation characters (CLASSIFY_ID1).
// NOTE(review): a one-character identifier ties in length with the earlier
// single-character CLASSIFY_xx rules, which win the tie; ID is therefore only
// produced for identifiers of two or more characters - confirm that is
// intended.
ID : CLASSIFY_ID0 CLASSIFY_ID1* // hand-written rule
    ;
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment
@bhamiltoncx can you reconsider the license for classify21.g4 (maybe make it MIT or BSD)? It's a pain that I have to duplicate all the work that led to it in a non-GPL environment. In the end we would have a very similar grammar, since the actual code points are the same.