Created
December 2, 2015 13:01
-
-
Save agopaul/dc533229ff5c2b6c52dd to your computer and use it in GitHub Desktop.
Unicode Character Ranges
This file contains hidden or bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
| <?php | |
| $chars = array ( | |
| array ( | |
| "unicodeCodePointBegin" => "0020", | |
| "utf8Begin" => "\x20", | |
| "unicodeCodePointEnd" => "007F", | |
| "utf8End" => "\x7f", | |
| "name" => "Basic Latin", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2580", | |
| "utf8Begin" => "\xe2\x96\x80", | |
| "unicodeCodePointEnd" => "259F", | |
| "utf8End" => "\xe2\x96\x9f", | |
| "name" => "Block Elements", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "00A0", | |
| "utf8Begin" => "\xc2\xa0", | |
| "unicodeCodePointEnd" => "00FF", | |
| "utf8End" => "\xc3\xbf", | |
| "name" => "Latin-1 Supplement", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "25A0", | |
| "utf8Begin" => "\xe2\x96\xa0", | |
| "unicodeCodePointEnd" => "25FF", | |
| "utf8End" => "\xe2\x97\xbf", | |
| "name" => "Geometric Shapes", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0100", | |
| "utf8Begin" => "\xc4\x80", | |
| "unicodeCodePointEnd" => "017F", | |
| "utf8End" => "\xc5\xbf", | |
| "name" => "Latin Extended-A", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2600", | |
| "utf8Begin" => "\xe2\x98\x80", | |
| "unicodeCodePointEnd" => "26FF", | |
| "utf8End" => "\xe2\x9b\xbf", | |
| "name" => "Miscellaneous Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0180", | |
| "utf8Begin" => "\xc6\x80", | |
| "unicodeCodePointEnd" => "024F", | |
| "utf8End" => "\xc9\x8f", | |
| "name" => "Latin Extended-B", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2700", | |
| "utf8Begin" => "\xe2\x9c\x80", | |
| "unicodeCodePointEnd" => "27BF", | |
| "utf8End" => "\xe2\x9e\xbf", | |
| "name" => "Dingbats", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0250", | |
| "utf8Begin" => "\xc9\x90", | |
| "unicodeCodePointEnd" => "02AF", | |
| "utf8End" => "\xca\xaf", | |
| "name" => "IPA Extensions", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "27C0", | |
| "utf8Begin" => "\xe2\x9f\x80", | |
| "unicodeCodePointEnd" => "27EF", | |
| "utf8End" => "\xe2\x9f\xaf", | |
| "name" => "Miscellaneous Mathematical Symbols-A", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "02B0", | |
| "utf8Begin" => "\xca\xb0", | |
| "unicodeCodePointEnd" => "02FF", | |
| "utf8End" => "\xcb\xbf", | |
| "name" => "Spacing Modifier Letters", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "27F0", | |
| "utf8Begin" => "\xe2\x9f\xb0", | |
| "unicodeCodePointEnd" => "27FF", | |
| "utf8End" => "\xe2\x9f\xbf", | |
| "name" => "Supplemental Arrows-A", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0300", | |
| "utf8Begin" => "\xcc\x80", | |
| "unicodeCodePointEnd" => "036F", | |
| "utf8End" => "\xcd\xaf", | |
| "name" => "Combining Diacritical Marks", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2800", | |
| "utf8Begin" => "\xe2\xa0\x80", | |
| "unicodeCodePointEnd" => "28FF", | |
| "utf8End" => "\xe2\xa3\xbf", | |
| "name" => "Braille Patterns", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0370", | |
| "utf8Begin" => "\xcd\xb0", | |
| "unicodeCodePointEnd" => "03FF", | |
| "utf8End" => "\xcf\xbf", | |
| "name" => "Greek and Coptic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2900", | |
| "utf8Begin" => "\xe2\xa4\x80", | |
| "unicodeCodePointEnd" => "297F", | |
| "utf8End" => "\xe2\xa5\xbf", | |
| "name" => "Supplemental Arrows-B", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0400", | |
| "utf8Begin" => "\xd0\x80", | |
| "unicodeCodePointEnd" => "04FF", | |
| "utf8End" => "\xd3\xbf", | |
| "name" => "Cyrillic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2980", | |
| "utf8Begin" => "\xe2\xa6\x80", | |
| "unicodeCodePointEnd" => "29FF", | |
| "utf8End" => "\xe2\xa7\xbf", | |
| "name" => "Miscellaneous Mathematical Symbols-B", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0500", | |
| "utf8Begin" => "\xd4\x80", | |
| "unicodeCodePointEnd" => "052F", | |
| "utf8End" => "\xd4\xaf", | |
| "name" => "Cyrillic Supplementary", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2A00", | |
| "utf8Begin" => "\xe2\xa8\x80", | |
| "unicodeCodePointEnd" => "2AFF", | |
| "utf8End" => "\xe2\xab\xbf", | |
| "name" => "Supplemental Mathematical Operators", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0530", | |
| "utf8Begin" => "\xd4\xb0", | |
| "unicodeCodePointEnd" => "058F", | |
| "utf8End" => "\xd6\x8f", | |
| "name" => "Armenian", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2B00", | |
| "utf8Begin" => "\xe2\xac\x80", | |
| "unicodeCodePointEnd" => "2BFF", | |
| "utf8End" => "\xe2\xaf\xbf", | |
| "name" => "Miscellaneous Symbols and Arrows", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0590", | |
| "utf8Begin" => "\xd6\x90", | |
| "unicodeCodePointEnd" => "05FF", | |
| "utf8End" => "\xd7\xbf", | |
| "name" => "Hebrew", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2E80", | |
| "utf8Begin" => "\xe2\xba\x80", | |
| "unicodeCodePointEnd" => "2EFF", | |
| "utf8End" => "\xe2\xbb\xbf", | |
| "name" => "CJK Radicals Supplement", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0600", | |
| "utf8Begin" => "\xd8\x80", | |
| "unicodeCodePointEnd" => "06FF", | |
| "utf8End" => "\xdb\xbf", | |
| "name" => "Arabic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2F00", | |
| "utf8Begin" => "\xe2\xbc\x80", | |
| "unicodeCodePointEnd" => "2FDF", | |
| "utf8End" => "\xe2\xbf\x9f", | |
| "name" => "Kangxi Radicals", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0700", | |
| "utf8Begin" => "\xdc\x80", | |
| "unicodeCodePointEnd" => "074F", | |
| "utf8End" => "\xdd\x8f", | |
| "name" => "Syriac", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2FF0", | |
| "utf8Begin" => "\xe2\xbf\xb0", | |
| "unicodeCodePointEnd" => "2FFF", | |
| "utf8End" => "\xe2\xbf\xbf", | |
| "name" => "Ideographic Description Characters", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0780", | |
| "utf8Begin" => "\xde\x80", | |
| "unicodeCodePointEnd" => "07BF", | |
| "utf8End" => "\xde\xbf", | |
| "name" => "Thaana", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3000", | |
| "utf8Begin" => "\xe3\x80\x80", | |
| "unicodeCodePointEnd" => "303F", | |
| "utf8End" => "\xe3\x80\xbf", | |
| "name" => "CJK Symbols and Punctuation", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0900", | |
| "utf8Begin" => "\xe0\xa4\x80", | |
| "unicodeCodePointEnd" => "097F", | |
| "utf8End" => "\xe0\xa5\xbf", | |
| "name" => "Devanagari", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3040", | |
| "utf8Begin" => "\xe3\x81\x80", | |
| "unicodeCodePointEnd" => "309F", | |
| "utf8End" => "\xe3\x82\x9f", | |
| "name" => "Hiragana", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0980", | |
| "utf8Begin" => "\xe0\xa6\x80", | |
| "unicodeCodePointEnd" => "09FF", | |
| "utf8End" => "\xe0\xa7\xbf", | |
| "name" => "Bengali", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "30A0", | |
| "utf8Begin" => "\xe3\x82\xa0", | |
| "unicodeCodePointEnd" => "30FF", | |
| "utf8End" => "\xe3\x83\xbf", | |
| "name" => "Katakana", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0A00", | |
| "utf8Begin" => "\xe0\xa8\x80", | |
| "unicodeCodePointEnd" => "0A7F", | |
| "utf8End" => "\xe0\xa9\xbf", | |
| "name" => "Gurmukhi", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3100", | |
| "utf8Begin" => "\xe3\x84\x80", | |
| "unicodeCodePointEnd" => "312F", | |
| "utf8End" => "\xe3\x84\xaf", | |
| "name" => "Bopomofo", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0A80", | |
| "utf8Begin" => "\xe0\xaa\x80", | |
| "unicodeCodePointEnd" => "0AFF", | |
| "utf8End" => "\xe0\xab\xbf", | |
| "name" => "Gujarati", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3130", | |
| "utf8Begin" => "\xe3\x84\xb0", | |
| "unicodeCodePointEnd" => "318F", | |
| "utf8End" => "\xe3\x86\x8f", | |
| "name" => "Hangul Compatibility Jamo", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0B00", | |
| "utf8Begin" => "\xe0\xac\x80", | |
| "unicodeCodePointEnd" => "0B7F", | |
| "utf8End" => "\xe0\xad\xbf", | |
| "name" => "Oriya", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3190", | |
| "utf8Begin" => "\xe3\x86\x90", | |
| "unicodeCodePointEnd" => "319F", | |
| "utf8End" => "\xe3\x86\x9f", | |
| "name" => "Kanbun", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0B80", | |
| "utf8Begin" => "\xe0\xae\x80", | |
| "unicodeCodePointEnd" => "0BFF", | |
| "utf8End" => "\xe0\xaf\xbf", | |
| "name" => "Tamil", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "31A0", | |
| "utf8Begin" => "\xe3\x86\xa0", | |
| "unicodeCodePointEnd" => "31BF", | |
| "utf8End" => "\xe3\x86\xbf", | |
| "name" => "Bopomofo Extended", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0C00", | |
| "utf8Begin" => "\xe0\xb0\x80", | |
| "unicodeCodePointEnd" => "0C7F", | |
| "utf8End" => "\xe0\xb1\xbf", | |
| "name" => "Telugu", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "31F0", | |
| "utf8Begin" => "\xe3\x87\xb0", | |
| "unicodeCodePointEnd" => "31FF", | |
| "utf8End" => "\xe3\x87\xbf", | |
| "name" => "Katakana Phonetic Extensions", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0C80", | |
| "utf8Begin" => "\xe0\xb2\x80", | |
| "unicodeCodePointEnd" => "0CFF", | |
| "utf8End" => "\xe0\xb3\xbf", | |
| "name" => "Kannada", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3200", | |
| "utf8Begin" => "\xe3\x88\x80", | |
| "unicodeCodePointEnd" => "32FF", | |
| "utf8End" => "\xe3\x8b\xbf", | |
| "name" => "Enclosed CJK Letters and Months", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0D00", | |
| "utf8Begin" => "\xe0\xb4\x80", | |
| "unicodeCodePointEnd" => "0D7F", | |
| "utf8End" => "\xe0\xb5\xbf", | |
| "name" => "Malayalam", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3300", | |
| "utf8Begin" => "\xe3\x8c\x80", | |
| "unicodeCodePointEnd" => "33FF", | |
| "utf8End" => "\xe3\x8f\xbf", | |
| "name" => "CJK Compatibility", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0D80", | |
| "utf8Begin" => "\xe0\xb6\x80", | |
| "unicodeCodePointEnd" => "0DFF", | |
| "utf8End" => "\xe0\xb7\xbf", | |
| "name" => "Sinhala", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "3400", | |
| "utf8Begin" => "\xe3\x90\x80", | |
| "unicodeCodePointEnd" => "4DBF", | |
| "utf8End" => "\xe4\xb6\xbf", | |
| "name" => "CJK Unified Ideographs Extension A", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0E00", | |
| "utf8Begin" => "\xe0\xb8\x80", | |
| "unicodeCodePointEnd" => "0E7F", | |
| "utf8End" => "\xe0\xb9\xbf", | |
| "name" => "Thai", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "4DC0", | |
| "utf8Begin" => "\xe4\xb7\x80", | |
| "unicodeCodePointEnd" => "4DFF", | |
| "utf8End" => "\xe4\xb7\xbf", | |
| "name" => "Yijing Hexagram Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0E80", | |
| "utf8Begin" => "\xe0\xba\x80", | |
| "unicodeCodePointEnd" => "0EFF", | |
| "utf8End" => "\xe0\xbb\xbf", | |
| "name" => "Lao", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "4E00", | |
| "utf8Begin" => "\xe4\xb8\x80", | |
| "unicodeCodePointEnd" => "9FFF", | |
| "utf8End" => "\xe9\xbf\xbf", | |
| "name" => "CJK Unified Ideographs", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "0F00", | |
| "utf8Begin" => "\xe0\xbc\x80", | |
| "unicodeCodePointEnd" => "0FFF", | |
| "utf8End" => "\xe0\xbf\xbf", | |
| "name" => "Tibetan", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "A000", | |
| "utf8Begin" => "\xea\x80\x80", | |
| "unicodeCodePointEnd" => "A48F", | |
| "utf8End" => "\xea\x92\x8f", | |
| "name" => "Yi Syllables", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1000", | |
| "utf8Begin" => "\xe1\x80\x80", | |
| "unicodeCodePointEnd" => "109F", | |
| "utf8End" => "\xe1\x82\x9f", | |
| "name" => "Myanmar", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "A490", | |
| "utf8Begin" => "\xea\x92\x90", | |
| "unicodeCodePointEnd" => "A4CF", | |
| "utf8End" => "\xea\x93\x8f", | |
| "name" => "Yi Radicals", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10A0", | |
| "utf8Begin" => "\xe1\x82\xa0", | |
| "unicodeCodePointEnd" => "10FF", | |
| "utf8End" => "\xe1\x83\xbf", | |
| "name" => "Georgian", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "AC00", | |
| "utf8Begin" => "\xea\xb0\x80", | |
| "unicodeCodePointEnd" => "D7AF", | |
| "utf8End" => "\xed\x9e\xaf", | |
| "name" => "Hangul Syllables", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1100", | |
| "utf8Begin" => "\xe1\x84\x80", | |
| "unicodeCodePointEnd" => "11FF", | |
| "utf8End" => "\xe1\x87\xbf", | |
| "name" => "Hangul Jamo", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "D800", | |
| "utf8Begin" => "\xed\xa0\x80", | |
| "unicodeCodePointEnd" => "DB7F", | |
| "utf8End" => "\xed\xad\xbf", | |
| "name" => "High Surrogates", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1200", | |
| "utf8Begin" => "\xe1\x88\x80", | |
| "unicodeCodePointEnd" => "137F", | |
| "utf8End" => "\xe1\x8d\xbf", | |
| "name" => "Ethiopic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "DB80", | |
| "utf8Begin" => "\xed\xae\x80", | |
| "unicodeCodePointEnd" => "DBFF", | |
| "utf8End" => "\xed\xaf\xbf", | |
| "name" => "High Private Use Surrogates", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "13A0", | |
| "utf8Begin" => "\xe1\x8e\xa0", | |
| "unicodeCodePointEnd" => "13FF", | |
| "utf8End" => "\xe1\x8f\xbf", | |
| "name" => "Cherokee", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "DC00", | |
| "utf8Begin" => "\xed\xb0\x80", | |
| "unicodeCodePointEnd" => "DFFF", | |
| "utf8End" => "\xed\xbf\xbf", | |
| "name" => "Low Surrogates", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1400", | |
| "utf8Begin" => "\xe1\x90\x80", | |
| "unicodeCodePointEnd" => "167F", | |
| "utf8End" => "\xe1\x99\xbf", | |
| "name" => "Unified Canadian Aboriginal Syllabics", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "E000", | |
| "utf8Begin" => "\xee\x80\x80", | |
| "unicodeCodePointEnd" => "F8FF", | |
| "utf8End" => "\xef\xa3\xbf", | |
| "name" => "Private Use Area", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1680", | |
| "utf8Begin" => "\xe1\x9a\x80", | |
| "unicodeCodePointEnd" => "169F", | |
| "utf8End" => "\xe1\x9a\x9f", | |
| "name" => "Ogham", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "F900", | |
| "utf8Begin" => "\xef\xa4\x80", | |
| "unicodeCodePointEnd" => "FAFF", | |
| "utf8End" => "\xef\xab\xbf", | |
| "name" => "CJK Compatibility Ideographs", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "16A0", | |
| "utf8Begin" => "\xe1\x9a\xa0", | |
| "unicodeCodePointEnd" => "16FF", | |
| "utf8End" => "\xe1\x9b\xbf", | |
| "name" => "Runic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FB00", | |
| "utf8Begin" => "\xef\xac\x80", | |
| "unicodeCodePointEnd" => "FB4F", | |
| "utf8End" => "\xef\xad\x8f", | |
| "name" => "Alphabetic Presentation Forms", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1700", | |
| "utf8Begin" => "\xe1\x9c\x80", | |
| "unicodeCodePointEnd" => "171F", | |
| "utf8End" => "\xe1\x9c\x9f", | |
| "name" => "Tagalog", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FB50", | |
| "utf8Begin" => "\xef\xad\x90", | |
| "unicodeCodePointEnd" => "FDFF", | |
| "utf8End" => "\xef\xb7\xbf", | |
| "name" => "Arabic Presentation Forms-A", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1720", | |
| "utf8Begin" => "\xe1\x9c\xa0", | |
| "unicodeCodePointEnd" => "173F", | |
| "utf8End" => "\xe1\x9c\xbf", | |
| "name" => "Hanunoo", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FE00", | |
| "utf8Begin" => "\xef\xb8\x80", | |
| "unicodeCodePointEnd" => "FE0F", | |
| "utf8End" => "\xef\xb8\x8f", | |
| "name" => "Variation Selectors", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1740", | |
| "utf8Begin" => "\xe1\x9d\x80", | |
| "unicodeCodePointEnd" => "175F", | |
| "utf8End" => "\xe1\x9d\x9f", | |
| "name" => "Buhid", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FE20", | |
| "utf8Begin" => "\xef\xb8\xa0", | |
| "unicodeCodePointEnd" => "FE2F", | |
| "utf8End" => "\xef\xb8\xaf", | |
| "name" => "Combining Half Marks", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1760", | |
| "utf8Begin" => "\xe1\x9d\xa0", | |
| "unicodeCodePointEnd" => "177F", | |
| "utf8End" => "\xe1\x9d\xbf", | |
| "name" => "Tagbanwa", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FE30", | |
| "utf8Begin" => "\xef\xb8\xb0", | |
| "unicodeCodePointEnd" => "FE4F", | |
| "utf8End" => "\xef\xb9\x8f", | |
| "name" => "CJK Compatibility Forms", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1780", | |
| "utf8Begin" => "\xe1\x9e\x80", | |
| "unicodeCodePointEnd" => "17FF", | |
| "utf8End" => "\xe1\x9f\xbf", | |
| "name" => "Khmer", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FE50", | |
| "utf8Begin" => "\xef\xb9\x90", | |
| "unicodeCodePointEnd" => "FE6F", | |
| "utf8End" => "\xef\xb9\xaf", | |
| "name" => "Small Form Variants", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1800", | |
| "utf8Begin" => "\xe1\xa0\x80", | |
| "unicodeCodePointEnd" => "18AF", | |
| "utf8End" => "\xe1\xa2\xaf", | |
| "name" => "Mongolian", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FE70", | |
| "utf8Begin" => "\xef\xb9\xb0", | |
| "unicodeCodePointEnd" => "FEFF", | |
| "utf8End" => "\xef\xbb\xbf", | |
| "name" => "Arabic Presentation Forms-B", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1900", | |
| "utf8Begin" => "\xe1\xa4\x80", | |
| "unicodeCodePointEnd" => "194F", | |
| "utf8End" => "\xe1\xa5\x8f", | |
| "name" => "Limbu", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FF00", | |
| "utf8Begin" => "\xef\xbc\x80", | |
| "unicodeCodePointEnd" => "FFEF", | |
| "utf8End" => "\xef\xbf\xaf", | |
| "name" => "Halfwidth and Fullwidth Forms", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1950", | |
| "utf8Begin" => "\xe1\xa5\x90", | |
| "unicodeCodePointEnd" => "197F", | |
| "utf8End" => "\xe1\xa5\xbf", | |
| "name" => "Tai Le", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "FFF0", | |
| "utf8Begin" => "\xef\xbf\xb0", | |
| "unicodeCodePointEnd" => "FFFF", | |
| "utf8End" => "\xef\xbf\xbf", | |
| "name" => "Specials", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "19E0", | |
| "utf8Begin" => "\xe1\xa7\xa0", | |
| "unicodeCodePointEnd" => "19FF", | |
| "utf8End" => "\xe1\xa7\xbf", | |
| "name" => "Khmer Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10000", | |
| "utf8Begin" => "\xf0\x90\x80\x80", | |
| "unicodeCodePointEnd" => "1007F", | |
| "utf8End" => "\xf0\x90\x81\xbf", | |
| "name" => "Linear B Syllabary", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1D00", | |
| "utf8Begin" => "\xe1\xb4\x80", | |
| "unicodeCodePointEnd" => "1D7F", | |
| "utf8End" => "\xe1\xb5\xbf", | |
| "name" => "Phonetic Extensions", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10080", | |
| "utf8Begin" => "\xf0\x90\x82\x80", | |
| "unicodeCodePointEnd" => "100FF", | |
| "utf8End" => "\xf0\x90\x83\xbf", | |
| "name" => "Linear B Ideograms", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1E00", | |
| "utf8Begin" => "\xe1\xb8\x80", | |
| "unicodeCodePointEnd" => "1EFF", | |
| "utf8End" => "\xe1\xbb\xbf", | |
| "name" => "Latin Extended Additional", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10100", | |
| "utf8Begin" => "\xf0\x90\x84\x80", | |
| "unicodeCodePointEnd" => "1013F", | |
| "utf8End" => "\xf0\x90\x84\xbf", | |
| "name" => "Aegean Numbers", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1F00", | |
| "utf8Begin" => "\xe1\xbc\x80", | |
| "unicodeCodePointEnd" => "1FFF", | |
| "utf8End" => "\xe1\xbf\xbf", | |
| "name" => "Greek Extended", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10300", | |
| "utf8Begin" => "\xf0\x90\x8c\x80", | |
| "unicodeCodePointEnd" => "1032F", | |
| "utf8End" => "\xf0\x90\x8c\xaf", | |
| "name" => "Old Italic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2000", | |
| "utf8Begin" => "\xe2\x80\x80", | |
| "unicodeCodePointEnd" => "206F", | |
| "utf8End" => "\xe2\x81\xaf", | |
| "name" => "General Punctuation", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10330", | |
| "utf8Begin" => "\xf0\x90\x8c\xb0", | |
| "unicodeCodePointEnd" => "1034F", | |
| "utf8End" => "\xf0\x90\x8d\x8f", | |
| "name" => "Gothic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2070", | |
| "utf8Begin" => "\xe2\x81\xb0", | |
| "unicodeCodePointEnd" => "209F", | |
| "utf8End" => "\xe2\x82\x9f", | |
| "name" => "Superscripts and Subscripts", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10380", | |
| "utf8Begin" => "\xf0\x90\x8e\x80", | |
| "unicodeCodePointEnd" => "1039F", | |
| "utf8End" => "\xf0\x90\x8e\x9f", | |
| "name" => "Ugaritic", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "20A0", | |
| "utf8Begin" => "\xe2\x82\xa0", | |
| "unicodeCodePointEnd" => "20CF", | |
| "utf8End" => "\xe2\x83\x8f", | |
| "name" => "Currency Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10400", | |
| "utf8Begin" => "\xf0\x90\x90\x80", | |
| "unicodeCodePointEnd" => "1044F", | |
| "utf8End" => "\xf0\x90\x91\x8f", | |
| "name" => "Deseret", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "20D0", | |
| "utf8Begin" => "\xe2\x83\x90", | |
| "unicodeCodePointEnd" => "20FF", | |
| "utf8End" => "\xe2\x83\xbf", | |
| "name" => "Combining Diacritical Marks for Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10450", | |
| "utf8Begin" => "\xf0\x90\x91\x90", | |
| "unicodeCodePointEnd" => "1047F", | |
| "utf8End" => "\xf0\x90\x91\xbf", | |
| "name" => "Shavian", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2100", | |
| "utf8Begin" => "\xe2\x84\x80", | |
| "unicodeCodePointEnd" => "214F", | |
| "utf8End" => "\xe2\x85\x8f", | |
| "name" => "Letterlike Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10480", | |
| "utf8Begin" => "\xf0\x90\x92\x80", | |
| "unicodeCodePointEnd" => "104AF", | |
| "utf8End" => "\xf0\x90\x92\xaf", | |
| "name" => "Osmanya", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2150", | |
| "utf8Begin" => "\xe2\x85\x90", | |
| "unicodeCodePointEnd" => "218F", | |
| "utf8End" => "\xe2\x86\x8f", | |
| "name" => "Number Forms", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "10800", | |
| "utf8Begin" => "\xf0\x90\xa0\x80", | |
| "unicodeCodePointEnd" => "1083F", | |
| "utf8End" => "\xf0\x90\xa0\xbf", | |
| "name" => "Cypriot Syllabary", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2190", | |
| "utf8Begin" => "\xe2\x86\x90", | |
| "unicodeCodePointEnd" => "21FF", | |
| "utf8End" => "\xe2\x87\xbf", | |
| "name" => "Arrows", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1D000", | |
| "utf8Begin" => "\xf0\x9d\x80\x80", | |
| "unicodeCodePointEnd" => "1D0FF", | |
| "utf8End" => "\xf0\x9d\x83\xbf", | |
| "name" => "Byzantine Musical Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2200", | |
| "utf8Begin" => "\xe2\x88\x80", | |
| "unicodeCodePointEnd" => "22FF", | |
| "utf8End" => "\xe2\x8b\xbf", | |
| "name" => "Mathematical Operators", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1D100", | |
| "utf8Begin" => "\xf0\x9d\x84\x80", | |
| "unicodeCodePointEnd" => "1D1FF", | |
| "utf8End" => "\xf0\x9d\x87\xbf", | |
| "name" => "Musical Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2300", | |
| "utf8Begin" => "\xe2\x8c\x80", | |
| "unicodeCodePointEnd" => "23FF", | |
| "utf8End" => "\xe2\x8f\xbf", | |
| "name" => "Miscellaneous Technical", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1D300", | |
| "utf8Begin" => "\xf0\x9d\x8c\x80", | |
| "unicodeCodePointEnd" => "1D35F", | |
| "utf8End" => "\xf0\x9d\x8d\x9f", | |
| "name" => "Tai Xuan Jing Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2400", | |
| "utf8Begin" => "\xe2\x90\x80", | |
| "unicodeCodePointEnd" => "243F", | |
| "utf8End" => "\xe2\x90\xbf", | |
| "name" => "Control Pictures", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "1D400", | |
| "utf8Begin" => "\xf0\x9d\x90\x80", | |
| "unicodeCodePointEnd" => "1D7FF", | |
| "utf8End" => "\xf0\x9d\x9f\xbf", | |
| "name" => "Mathematical Alphanumeric Symbols", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2440", | |
| "utf8Begin" => "\xe2\x91\x80", | |
| "unicodeCodePointEnd" => "245F", | |
| "utf8End" => "\xe2\x91\x9f", | |
| "name" => "Optical Character Recognition", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "20000", | |
| "utf8Begin" => "\xf0\xa0\x80\x80", | |
| "unicodeCodePointEnd" => "2A6DF", | |
| "utf8End" => "\xf0\xaa\x9b\x9f", | |
| "name" => "CJK Unified Ideographs Extension B", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2460", | |
| "utf8Begin" => "\xe2\x91\xa0", | |
| "unicodeCodePointEnd" => "24FF", | |
| "utf8End" => "\xe2\x93\xbf", | |
| "name" => "Enclosed Alphanumerics", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2F800", | |
| "utf8Begin" => "\xf0\xaf\xa0\x80", | |
| "unicodeCodePointEnd" => "2FA1F", | |
| "utf8End" => "\xf0\xaf\xa8\x9f", | |
| "name" => "CJK Compatibility Ideographs Supplement", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "2500", | |
| "utf8Begin" => "\xe2\x94\x80", | |
| "unicodeCodePointEnd" => "257F", | |
| "utf8End" => "\xe2\x95\xbf", | |
| "name" => "Box Drawing", | |
| ), | |
| array ( | |
| "unicodeCodePointBegin" => "E0000", | |
| "utf8Begin" => "\xf3\xa0\x80\x80", | |
| "unicodeCodePointEnd" => "E007F", | |
| "utf8End" => "\xf3\xa0\x81\xbf", | |
| "name" => "Tags", | |
| ), | |
| ); |
Sign up for free
to join this conversation on GitHub.
Already have an account?
Sign in to comment