Skip to content

Instantly share code, notes, and snippets.

@agopaul
Created December 2, 2015 13:01
Show Gist options
  • Select an option

  • Save agopaul/dc533229ff5c2b6c52dd to your computer and use it in GitHub Desktop.

Select an option

Save agopaul/dc533229ff5c2b6c52dd to your computer and use it in GitHub Desktop.
Unicode Character Ranges
<?php
/**
 * Lookup table of Unicode character ranges.
 *
 * Every row is a map holding five string entries, always in this key order:
 *  - unicodeCodePointBegin: first code point of the range, as upper-case hex
 *                           digits (4 or 5 of them) with no "U+" prefix;
 *  - utf8Begin:             that same code point as a raw UTF-8 byte string;
 *  - unicodeCodePointEnd:   final code point of the range, same hex format.
 *                           The bound is inclusive: neighbouring ranges such
 *                           as 2580-259F and 25A0-25FF do not share a value;
 *  - utf8End:               the final code point as a raw UTF-8 byte string;
 *  - name:                  human-readable label for the range.
 *
 * Things to be aware of when consuming the table:
 *  - Rows are NOT sorted by code point (0020, 2580, 00A0, 25A0, ...). The
 *    order is kept as-is because the list is positionally indexed.
 *  - The "Basic Latin" row begins at 0020, not 0000.
 *  - The three surrogate rows (D800-DFFF) carry the plain three-byte encoding
 *    of their bounds. NOTE(review): surrogate code points are not permitted in
 *    well-formed UTF-8, so strict validators (e.g. PCRE with the "u" modifier)
 *    will reject those byte strings.
 *  - The byte-string values use double quotes on purpose: the "\x.." escapes
 *    must be interpreted by PHP.
 *
 * @var list<array{
 *     unicodeCodePointBegin: string,
 *     utf8Begin: string,
 *     unicodeCodePointEnd: string,
 *     utf8End: string,
 *     name: string
 * }> $chars
 */
$chars = [
    [
        'unicodeCodePointBegin' => '0020',
        'utf8Begin' => "\x20",
        'unicodeCodePointEnd' => '007F',
        'utf8End' => "\x7f",
        'name' => 'Basic Latin',
    ],
    [
        'unicodeCodePointBegin' => '2580',
        'utf8Begin' => "\xe2\x96\x80",
        'unicodeCodePointEnd' => '259F',
        'utf8End' => "\xe2\x96\x9f",
        'name' => 'Block Elements',
    ],
    [
        'unicodeCodePointBegin' => '00A0',
        'utf8Begin' => "\xc2\xa0",
        'unicodeCodePointEnd' => '00FF',
        'utf8End' => "\xc3\xbf",
        'name' => 'Latin-1 Supplement',
    ],
    [
        'unicodeCodePointBegin' => '25A0',
        'utf8Begin' => "\xe2\x96\xa0",
        'unicodeCodePointEnd' => '25FF',
        'utf8End' => "\xe2\x97\xbf",
        'name' => 'Geometric Shapes',
    ],
    [
        'unicodeCodePointBegin' => '0100',
        'utf8Begin' => "\xc4\x80",
        'unicodeCodePointEnd' => '017F',
        'utf8End' => "\xc5\xbf",
        'name' => 'Latin Extended-A',
    ],
    [
        'unicodeCodePointBegin' => '2600',
        'utf8Begin' => "\xe2\x98\x80",
        'unicodeCodePointEnd' => '26FF',
        'utf8End' => "\xe2\x9b\xbf",
        'name' => 'Miscellaneous Symbols',
    ],
    [
        'unicodeCodePointBegin' => '0180',
        'utf8Begin' => "\xc6\x80",
        'unicodeCodePointEnd' => '024F',
        'utf8End' => "\xc9\x8f",
        'name' => 'Latin Extended-B',
    ],
    [
        'unicodeCodePointBegin' => '2700',
        'utf8Begin' => "\xe2\x9c\x80",
        'unicodeCodePointEnd' => '27BF',
        'utf8End' => "\xe2\x9e\xbf",
        'name' => 'Dingbats',
    ],
    [
        'unicodeCodePointBegin' => '0250',
        'utf8Begin' => "\xc9\x90",
        'unicodeCodePointEnd' => '02AF',
        'utf8End' => "\xca\xaf",
        'name' => 'IPA Extensions',
    ],
    [
        'unicodeCodePointBegin' => '27C0',
        'utf8Begin' => "\xe2\x9f\x80",
        'unicodeCodePointEnd' => '27EF',
        'utf8End' => "\xe2\x9f\xaf",
        'name' => 'Miscellaneous Mathematical Symbols-A',
    ],
    [
        'unicodeCodePointBegin' => '02B0',
        'utf8Begin' => "\xca\xb0",
        'unicodeCodePointEnd' => '02FF',
        'utf8End' => "\xcb\xbf",
        'name' => 'Spacing Modifier Letters',
    ],
    [
        'unicodeCodePointBegin' => '27F0',
        'utf8Begin' => "\xe2\x9f\xb0",
        'unicodeCodePointEnd' => '27FF',
        'utf8End' => "\xe2\x9f\xbf",
        'name' => 'Supplemental Arrows-A',
    ],
    [
        'unicodeCodePointBegin' => '0300',
        'utf8Begin' => "\xcc\x80",
        'unicodeCodePointEnd' => '036F',
        'utf8End' => "\xcd\xaf",
        'name' => 'Combining Diacritical Marks',
    ],
    [
        'unicodeCodePointBegin' => '2800',
        'utf8Begin' => "\xe2\xa0\x80",
        'unicodeCodePointEnd' => '28FF',
        'utf8End' => "\xe2\xa3\xbf",
        'name' => 'Braille Patterns',
    ],
    [
        'unicodeCodePointBegin' => '0370',
        'utf8Begin' => "\xcd\xb0",
        'unicodeCodePointEnd' => '03FF',
        'utf8End' => "\xcf\xbf",
        'name' => 'Greek and Coptic',
    ],
    [
        'unicodeCodePointBegin' => '2900',
        'utf8Begin' => "\xe2\xa4\x80",
        'unicodeCodePointEnd' => '297F',
        'utf8End' => "\xe2\xa5\xbf",
        'name' => 'Supplemental Arrows-B',
    ],
    [
        'unicodeCodePointBegin' => '0400',
        'utf8Begin' => "\xd0\x80",
        'unicodeCodePointEnd' => '04FF',
        'utf8End' => "\xd3\xbf",
        'name' => 'Cyrillic',
    ],
    [
        'unicodeCodePointBegin' => '2980',
        'utf8Begin' => "\xe2\xa6\x80",
        'unicodeCodePointEnd' => '29FF',
        'utf8End' => "\xe2\xa7\xbf",
        'name' => 'Miscellaneous Mathematical Symbols-B',
    ],
    [
        'unicodeCodePointBegin' => '0500',
        'utf8Begin' => "\xd4\x80",
        'unicodeCodePointEnd' => '052F',
        'utf8End' => "\xd4\xaf",
        'name' => 'Cyrillic Supplementary',
    ],
    [
        'unicodeCodePointBegin' => '2A00',
        'utf8Begin' => "\xe2\xa8\x80",
        'unicodeCodePointEnd' => '2AFF',
        'utf8End' => "\xe2\xab\xbf",
        'name' => 'Supplemental Mathematical Operators',
    ],
    [
        'unicodeCodePointBegin' => '0530',
        'utf8Begin' => "\xd4\xb0",
        'unicodeCodePointEnd' => '058F',
        'utf8End' => "\xd6\x8f",
        'name' => 'Armenian',
    ],
    [
        'unicodeCodePointBegin' => '2B00',
        'utf8Begin' => "\xe2\xac\x80",
        'unicodeCodePointEnd' => '2BFF',
        'utf8End' => "\xe2\xaf\xbf",
        'name' => 'Miscellaneous Symbols and Arrows',
    ],
    [
        'unicodeCodePointBegin' => '0590',
        'utf8Begin' => "\xd6\x90",
        'unicodeCodePointEnd' => '05FF',
        'utf8End' => "\xd7\xbf",
        'name' => 'Hebrew',
    ],
    [
        'unicodeCodePointBegin' => '2E80',
        'utf8Begin' => "\xe2\xba\x80",
        'unicodeCodePointEnd' => '2EFF',
        'utf8End' => "\xe2\xbb\xbf",
        'name' => 'CJK Radicals Supplement',
    ],
    [
        'unicodeCodePointBegin' => '0600',
        'utf8Begin' => "\xd8\x80",
        'unicodeCodePointEnd' => '06FF',
        'utf8End' => "\xdb\xbf",
        'name' => 'Arabic',
    ],
    [
        'unicodeCodePointBegin' => '2F00',
        'utf8Begin' => "\xe2\xbc\x80",
        'unicodeCodePointEnd' => '2FDF',
        'utf8End' => "\xe2\xbf\x9f",
        'name' => 'Kangxi Radicals',
    ],
    [
        'unicodeCodePointBegin' => '0700',
        'utf8Begin' => "\xdc\x80",
        'unicodeCodePointEnd' => '074F',
        'utf8End' => "\xdd\x8f",
        'name' => 'Syriac',
    ],
    [
        'unicodeCodePointBegin' => '2FF0',
        'utf8Begin' => "\xe2\xbf\xb0",
        'unicodeCodePointEnd' => '2FFF',
        'utf8End' => "\xe2\xbf\xbf",
        'name' => 'Ideographic Description Characters',
    ],
    [
        'unicodeCodePointBegin' => '0780',
        'utf8Begin' => "\xde\x80",
        'unicodeCodePointEnd' => '07BF',
        'utf8End' => "\xde\xbf",
        'name' => 'Thaana',
    ],
    [
        'unicodeCodePointBegin' => '3000',
        'utf8Begin' => "\xe3\x80\x80",
        'unicodeCodePointEnd' => '303F',
        'utf8End' => "\xe3\x80\xbf",
        'name' => 'CJK Symbols and Punctuation',
    ],
    [
        'unicodeCodePointBegin' => '0900',
        'utf8Begin' => "\xe0\xa4\x80",
        'unicodeCodePointEnd' => '097F',
        'utf8End' => "\xe0\xa5\xbf",
        'name' => 'Devanagari',
    ],
    [
        'unicodeCodePointBegin' => '3040',
        'utf8Begin' => "\xe3\x81\x80",
        'unicodeCodePointEnd' => '309F',
        'utf8End' => "\xe3\x82\x9f",
        'name' => 'Hiragana',
    ],
    [
        'unicodeCodePointBegin' => '0980',
        'utf8Begin' => "\xe0\xa6\x80",
        'unicodeCodePointEnd' => '09FF',
        'utf8End' => "\xe0\xa7\xbf",
        'name' => 'Bengali',
    ],
    [
        'unicodeCodePointBegin' => '30A0',
        'utf8Begin' => "\xe3\x82\xa0",
        'unicodeCodePointEnd' => '30FF',
        'utf8End' => "\xe3\x83\xbf",
        'name' => 'Katakana',
    ],
    [
        'unicodeCodePointBegin' => '0A00',
        'utf8Begin' => "\xe0\xa8\x80",
        'unicodeCodePointEnd' => '0A7F',
        'utf8End' => "\xe0\xa9\xbf",
        'name' => 'Gurmukhi',
    ],
    [
        'unicodeCodePointBegin' => '3100',
        'utf8Begin' => "\xe3\x84\x80",
        'unicodeCodePointEnd' => '312F',
        'utf8End' => "\xe3\x84\xaf",
        'name' => 'Bopomofo',
    ],
    [
        'unicodeCodePointBegin' => '0A80',
        'utf8Begin' => "\xe0\xaa\x80",
        'unicodeCodePointEnd' => '0AFF',
        'utf8End' => "\xe0\xab\xbf",
        'name' => 'Gujarati',
    ],
    [
        'unicodeCodePointBegin' => '3130',
        'utf8Begin' => "\xe3\x84\xb0",
        'unicodeCodePointEnd' => '318F',
        'utf8End' => "\xe3\x86\x8f",
        'name' => 'Hangul Compatibility Jamo',
    ],
    [
        'unicodeCodePointBegin' => '0B00',
        'utf8Begin' => "\xe0\xac\x80",
        'unicodeCodePointEnd' => '0B7F',
        'utf8End' => "\xe0\xad\xbf",
        'name' => 'Oriya',
    ],
    [
        'unicodeCodePointBegin' => '3190',
        'utf8Begin' => "\xe3\x86\x90",
        'unicodeCodePointEnd' => '319F',
        'utf8End' => "\xe3\x86\x9f",
        'name' => 'Kanbun',
    ],
    [
        'unicodeCodePointBegin' => '0B80',
        'utf8Begin' => "\xe0\xae\x80",
        'unicodeCodePointEnd' => '0BFF',
        'utf8End' => "\xe0\xaf\xbf",
        'name' => 'Tamil',
    ],
    [
        'unicodeCodePointBegin' => '31A0',
        'utf8Begin' => "\xe3\x86\xa0",
        'unicodeCodePointEnd' => '31BF',
        'utf8End' => "\xe3\x86\xbf",
        'name' => 'Bopomofo Extended',
    ],
    [
        'unicodeCodePointBegin' => '0C00',
        'utf8Begin' => "\xe0\xb0\x80",
        'unicodeCodePointEnd' => '0C7F',
        'utf8End' => "\xe0\xb1\xbf",
        'name' => 'Telugu',
    ],
    [
        'unicodeCodePointBegin' => '31F0',
        'utf8Begin' => "\xe3\x87\xb0",
        'unicodeCodePointEnd' => '31FF',
        'utf8End' => "\xe3\x87\xbf",
        'name' => 'Katakana Phonetic Extensions',
    ],
    [
        'unicodeCodePointBegin' => '0C80',
        'utf8Begin' => "\xe0\xb2\x80",
        'unicodeCodePointEnd' => '0CFF',
        'utf8End' => "\xe0\xb3\xbf",
        'name' => 'Kannada',
    ],
    [
        'unicodeCodePointBegin' => '3200',
        'utf8Begin' => "\xe3\x88\x80",
        'unicodeCodePointEnd' => '32FF',
        'utf8End' => "\xe3\x8b\xbf",
        'name' => 'Enclosed CJK Letters and Months',
    ],
    [
        'unicodeCodePointBegin' => '0D00',
        'utf8Begin' => "\xe0\xb4\x80",
        'unicodeCodePointEnd' => '0D7F',
        'utf8End' => "\xe0\xb5\xbf",
        'name' => 'Malayalam',
    ],
    [
        'unicodeCodePointBegin' => '3300',
        'utf8Begin' => "\xe3\x8c\x80",
        'unicodeCodePointEnd' => '33FF',
        'utf8End' => "\xe3\x8f\xbf",
        'name' => 'CJK Compatibility',
    ],
    [
        'unicodeCodePointBegin' => '0D80',
        'utf8Begin' => "\xe0\xb6\x80",
        'unicodeCodePointEnd' => '0DFF',
        'utf8End' => "\xe0\xb7\xbf",
        'name' => 'Sinhala',
    ],
    [
        'unicodeCodePointBegin' => '3400',
        'utf8Begin' => "\xe3\x90\x80",
        'unicodeCodePointEnd' => '4DBF',
        'utf8End' => "\xe4\xb6\xbf",
        'name' => 'CJK Unified Ideographs Extension A',
    ],
    [
        'unicodeCodePointBegin' => '0E00',
        'utf8Begin' => "\xe0\xb8\x80",
        'unicodeCodePointEnd' => '0E7F',
        'utf8End' => "\xe0\xb9\xbf",
        'name' => 'Thai',
    ],
    [
        'unicodeCodePointBegin' => '4DC0',
        'utf8Begin' => "\xe4\xb7\x80",
        'unicodeCodePointEnd' => '4DFF',
        'utf8End' => "\xe4\xb7\xbf",
        'name' => 'Yijing Hexagram Symbols',
    ],
    [
        'unicodeCodePointBegin' => '0E80',
        'utf8Begin' => "\xe0\xba\x80",
        'unicodeCodePointEnd' => '0EFF',
        'utf8End' => "\xe0\xbb\xbf",
        'name' => 'Lao',
    ],
    [
        'unicodeCodePointBegin' => '4E00',
        'utf8Begin' => "\xe4\xb8\x80",
        'unicodeCodePointEnd' => '9FFF',
        'utf8End' => "\xe9\xbf\xbf",
        'name' => 'CJK Unified Ideographs',
    ],
    [
        'unicodeCodePointBegin' => '0F00',
        'utf8Begin' => "\xe0\xbc\x80",
        'unicodeCodePointEnd' => '0FFF',
        'utf8End' => "\xe0\xbf\xbf",
        'name' => 'Tibetan',
    ],
    [
        'unicodeCodePointBegin' => 'A000',
        'utf8Begin' => "\xea\x80\x80",
        'unicodeCodePointEnd' => 'A48F',
        'utf8End' => "\xea\x92\x8f",
        'name' => 'Yi Syllables',
    ],
    [
        'unicodeCodePointBegin' => '1000',
        'utf8Begin' => "\xe1\x80\x80",
        'unicodeCodePointEnd' => '109F',
        'utf8End' => "\xe1\x82\x9f",
        'name' => 'Myanmar',
    ],
    [
        'unicodeCodePointBegin' => 'A490',
        'utf8Begin' => "\xea\x92\x90",
        'unicodeCodePointEnd' => 'A4CF',
        'utf8End' => "\xea\x93\x8f",
        'name' => 'Yi Radicals',
    ],
    [
        'unicodeCodePointBegin' => '10A0',
        'utf8Begin' => "\xe1\x82\xa0",
        'unicodeCodePointEnd' => '10FF',
        'utf8End' => "\xe1\x83\xbf",
        'name' => 'Georgian',
    ],
    [
        'unicodeCodePointBegin' => 'AC00',
        'utf8Begin' => "\xea\xb0\x80",
        'unicodeCodePointEnd' => 'D7AF',
        'utf8End' => "\xed\x9e\xaf",
        'name' => 'Hangul Syllables',
    ],
    [
        'unicodeCodePointBegin' => '1100',
        'utf8Begin' => "\xe1\x84\x80",
        'unicodeCodePointEnd' => '11FF',
        'utf8End' => "\xe1\x87\xbf",
        'name' => 'Hangul Jamo',
    ],
    [
        'unicodeCodePointBegin' => 'D800',
        'utf8Begin' => "\xed\xa0\x80",
        'unicodeCodePointEnd' => 'DB7F',
        'utf8End' => "\xed\xad\xbf",
        'name' => 'High Surrogates',
    ],
    [
        'unicodeCodePointBegin' => '1200',
        'utf8Begin' => "\xe1\x88\x80",
        'unicodeCodePointEnd' => '137F',
        'utf8End' => "\xe1\x8d\xbf",
        'name' => 'Ethiopic',
    ],
    [
        'unicodeCodePointBegin' => 'DB80',
        'utf8Begin' => "\xed\xae\x80",
        'unicodeCodePointEnd' => 'DBFF',
        'utf8End' => "\xed\xaf\xbf",
        'name' => 'High Private Use Surrogates',
    ],
    [
        'unicodeCodePointBegin' => '13A0',
        'utf8Begin' => "\xe1\x8e\xa0",
        'unicodeCodePointEnd' => '13FF',
        'utf8End' => "\xe1\x8f\xbf",
        'name' => 'Cherokee',
    ],
    [
        'unicodeCodePointBegin' => 'DC00',
        'utf8Begin' => "\xed\xb0\x80",
        'unicodeCodePointEnd' => 'DFFF',
        'utf8End' => "\xed\xbf\xbf",
        'name' => 'Low Surrogates',
    ],
    [
        'unicodeCodePointBegin' => '1400',
        'utf8Begin' => "\xe1\x90\x80",
        'unicodeCodePointEnd' => '167F',
        'utf8End' => "\xe1\x99\xbf",
        'name' => 'Unified Canadian Aboriginal Syllabics',
    ],
    [
        'unicodeCodePointBegin' => 'E000',
        'utf8Begin' => "\xee\x80\x80",
        'unicodeCodePointEnd' => 'F8FF',
        'utf8End' => "\xef\xa3\xbf",
        'name' => 'Private Use Area',
    ],
    [
        'unicodeCodePointBegin' => '1680',
        'utf8Begin' => "\xe1\x9a\x80",
        'unicodeCodePointEnd' => '169F',
        'utf8End' => "\xe1\x9a\x9f",
        'name' => 'Ogham',
    ],
    [
        'unicodeCodePointBegin' => 'F900',
        'utf8Begin' => "\xef\xa4\x80",
        'unicodeCodePointEnd' => 'FAFF',
        'utf8End' => "\xef\xab\xbf",
        'name' => 'CJK Compatibility Ideographs',
    ],
    [
        'unicodeCodePointBegin' => '16A0',
        'utf8Begin' => "\xe1\x9a\xa0",
        'unicodeCodePointEnd' => '16FF',
        'utf8End' => "\xe1\x9b\xbf",
        'name' => 'Runic',
    ],
    [
        'unicodeCodePointBegin' => 'FB00',
        'utf8Begin' => "\xef\xac\x80",
        'unicodeCodePointEnd' => 'FB4F',
        'utf8End' => "\xef\xad\x8f",
        'name' => 'Alphabetic Presentation Forms',
    ],
    [
        'unicodeCodePointBegin' => '1700',
        'utf8Begin' => "\xe1\x9c\x80",
        'unicodeCodePointEnd' => '171F',
        'utf8End' => "\xe1\x9c\x9f",
        'name' => 'Tagalog',
    ],
    [
        'unicodeCodePointBegin' => 'FB50',
        'utf8Begin' => "\xef\xad\x90",
        'unicodeCodePointEnd' => 'FDFF',
        'utf8End' => "\xef\xb7\xbf",
        'name' => 'Arabic Presentation Forms-A',
    ],
    [
        'unicodeCodePointBegin' => '1720',
        'utf8Begin' => "\xe1\x9c\xa0",
        'unicodeCodePointEnd' => '173F',
        'utf8End' => "\xe1\x9c\xbf",
        'name' => 'Hanunoo',
    ],
    [
        'unicodeCodePointBegin' => 'FE00',
        'utf8Begin' => "\xef\xb8\x80",
        'unicodeCodePointEnd' => 'FE0F',
        'utf8End' => "\xef\xb8\x8f",
        'name' => 'Variation Selectors',
    ],
    [
        'unicodeCodePointBegin' => '1740',
        'utf8Begin' => "\xe1\x9d\x80",
        'unicodeCodePointEnd' => '175F',
        'utf8End' => "\xe1\x9d\x9f",
        'name' => 'Buhid',
    ],
    [
        'unicodeCodePointBegin' => 'FE20',
        'utf8Begin' => "\xef\xb8\xa0",
        'unicodeCodePointEnd' => 'FE2F',
        'utf8End' => "\xef\xb8\xaf",
        'name' => 'Combining Half Marks',
    ],
    [
        'unicodeCodePointBegin' => '1760',
        'utf8Begin' => "\xe1\x9d\xa0",
        'unicodeCodePointEnd' => '177F',
        'utf8End' => "\xe1\x9d\xbf",
        'name' => 'Tagbanwa',
    ],
    [
        'unicodeCodePointBegin' => 'FE30',
        'utf8Begin' => "\xef\xb8\xb0",
        'unicodeCodePointEnd' => 'FE4F',
        'utf8End' => "\xef\xb9\x8f",
        'name' => 'CJK Compatibility Forms',
    ],
    [
        'unicodeCodePointBegin' => '1780',
        'utf8Begin' => "\xe1\x9e\x80",
        'unicodeCodePointEnd' => '17FF',
        'utf8End' => "\xe1\x9f\xbf",
        'name' => 'Khmer',
    ],
    [
        'unicodeCodePointBegin' => 'FE50',
        'utf8Begin' => "\xef\xb9\x90",
        'unicodeCodePointEnd' => 'FE6F',
        'utf8End' => "\xef\xb9\xaf",
        'name' => 'Small Form Variants',
    ],
    [
        'unicodeCodePointBegin' => '1800',
        'utf8Begin' => "\xe1\xa0\x80",
        'unicodeCodePointEnd' => '18AF',
        'utf8End' => "\xe1\xa2\xaf",
        'name' => 'Mongolian',
    ],
    [
        'unicodeCodePointBegin' => 'FE70',
        'utf8Begin' => "\xef\xb9\xb0",
        'unicodeCodePointEnd' => 'FEFF',
        'utf8End' => "\xef\xbb\xbf",
        'name' => 'Arabic Presentation Forms-B',
    ],
    [
        'unicodeCodePointBegin' => '1900',
        'utf8Begin' => "\xe1\xa4\x80",
        'unicodeCodePointEnd' => '194F',
        'utf8End' => "\xe1\xa5\x8f",
        'name' => 'Limbu',
    ],
    [
        'unicodeCodePointBegin' => 'FF00',
        'utf8Begin' => "\xef\xbc\x80",
        'unicodeCodePointEnd' => 'FFEF',
        'utf8End' => "\xef\xbf\xaf",
        'name' => 'Halfwidth and Fullwidth Forms',
    ],
    [
        'unicodeCodePointBegin' => '1950',
        'utf8Begin' => "\xe1\xa5\x90",
        'unicodeCodePointEnd' => '197F',
        'utf8End' => "\xe1\xa5\xbf",
        'name' => 'Tai Le',
    ],
    [
        'unicodeCodePointBegin' => 'FFF0',
        'utf8Begin' => "\xef\xbf\xb0",
        'unicodeCodePointEnd' => 'FFFF',
        'utf8End' => "\xef\xbf\xbf",
        'name' => 'Specials',
    ],
    [
        'unicodeCodePointBegin' => '19E0',
        'utf8Begin' => "\xe1\xa7\xa0",
        'unicodeCodePointEnd' => '19FF',
        'utf8End' => "\xe1\xa7\xbf",
        'name' => 'Khmer Symbols',
    ],
    [
        'unicodeCodePointBegin' => '10000',
        'utf8Begin' => "\xf0\x90\x80\x80",
        'unicodeCodePointEnd' => '1007F',
        'utf8End' => "\xf0\x90\x81\xbf",
        'name' => 'Linear B Syllabary',
    ],
    [
        'unicodeCodePointBegin' => '1D00',
        'utf8Begin' => "\xe1\xb4\x80",
        'unicodeCodePointEnd' => '1D7F',
        'utf8End' => "\xe1\xb5\xbf",
        'name' => 'Phonetic Extensions',
    ],
    [
        'unicodeCodePointBegin' => '10080',
        'utf8Begin' => "\xf0\x90\x82\x80",
        'unicodeCodePointEnd' => '100FF',
        'utf8End' => "\xf0\x90\x83\xbf",
        'name' => 'Linear B Ideograms',
    ],
    [
        'unicodeCodePointBegin' => '1E00',
        'utf8Begin' => "\xe1\xb8\x80",
        'unicodeCodePointEnd' => '1EFF',
        'utf8End' => "\xe1\xbb\xbf",
        'name' => 'Latin Extended Additional',
    ],
    [
        'unicodeCodePointBegin' => '10100',
        'utf8Begin' => "\xf0\x90\x84\x80",
        'unicodeCodePointEnd' => '1013F',
        'utf8End' => "\xf0\x90\x84\xbf",
        'name' => 'Aegean Numbers',
    ],
    [
        'unicodeCodePointBegin' => '1F00',
        'utf8Begin' => "\xe1\xbc\x80",
        'unicodeCodePointEnd' => '1FFF',
        'utf8End' => "\xe1\xbf\xbf",
        'name' => 'Greek Extended',
    ],
    [
        'unicodeCodePointBegin' => '10300',
        'utf8Begin' => "\xf0\x90\x8c\x80",
        'unicodeCodePointEnd' => '1032F',
        'utf8End' => "\xf0\x90\x8c\xaf",
        'name' => 'Old Italic',
    ],
    [
        'unicodeCodePointBegin' => '2000',
        'utf8Begin' => "\xe2\x80\x80",
        'unicodeCodePointEnd' => '206F',
        'utf8End' => "\xe2\x81\xaf",
        'name' => 'General Punctuation',
    ],
    [
        'unicodeCodePointBegin' => '10330',
        'utf8Begin' => "\xf0\x90\x8c\xb0",
        'unicodeCodePointEnd' => '1034F',
        'utf8End' => "\xf0\x90\x8d\x8f",
        'name' => 'Gothic',
    ],
    [
        'unicodeCodePointBegin' => '2070',
        'utf8Begin' => "\xe2\x81\xb0",
        'unicodeCodePointEnd' => '209F',
        'utf8End' => "\xe2\x82\x9f",
        'name' => 'Superscripts and Subscripts',
    ],
    [
        'unicodeCodePointBegin' => '10380',
        'utf8Begin' => "\xf0\x90\x8e\x80",
        'unicodeCodePointEnd' => '1039F',
        'utf8End' => "\xf0\x90\x8e\x9f",
        'name' => 'Ugaritic',
    ],
    [
        'unicodeCodePointBegin' => '20A0',
        'utf8Begin' => "\xe2\x82\xa0",
        'unicodeCodePointEnd' => '20CF',
        'utf8End' => "\xe2\x83\x8f",
        'name' => 'Currency Symbols',
    ],
    [
        'unicodeCodePointBegin' => '10400',
        'utf8Begin' => "\xf0\x90\x90\x80",
        'unicodeCodePointEnd' => '1044F',
        'utf8End' => "\xf0\x90\x91\x8f",
        'name' => 'Deseret',
    ],
    [
        'unicodeCodePointBegin' => '20D0',
        'utf8Begin' => "\xe2\x83\x90",
        'unicodeCodePointEnd' => '20FF',
        'utf8End' => "\xe2\x83\xbf",
        'name' => 'Combining Diacritical Marks for Symbols',
    ],
    [
        'unicodeCodePointBegin' => '10450',
        'utf8Begin' => "\xf0\x90\x91\x90",
        'unicodeCodePointEnd' => '1047F',
        'utf8End' => "\xf0\x90\x91\xbf",
        'name' => 'Shavian',
    ],
    [
        'unicodeCodePointBegin' => '2100',
        'utf8Begin' => "\xe2\x84\x80",
        'unicodeCodePointEnd' => '214F',
        'utf8End' => "\xe2\x85\x8f",
        'name' => 'Letterlike Symbols',
    ],
    [
        'unicodeCodePointBegin' => '10480',
        'utf8Begin' => "\xf0\x90\x92\x80",
        'unicodeCodePointEnd' => '104AF',
        'utf8End' => "\xf0\x90\x92\xaf",
        'name' => 'Osmanya',
    ],
    [
        'unicodeCodePointBegin' => '2150',
        'utf8Begin' => "\xe2\x85\x90",
        'unicodeCodePointEnd' => '218F',
        'utf8End' => "\xe2\x86\x8f",
        'name' => 'Number Forms',
    ],
    [
        'unicodeCodePointBegin' => '10800',
        'utf8Begin' => "\xf0\x90\xa0\x80",
        'unicodeCodePointEnd' => '1083F',
        'utf8End' => "\xf0\x90\xa0\xbf",
        'name' => 'Cypriot Syllabary',
    ],
    [
        'unicodeCodePointBegin' => '2190',
        'utf8Begin' => "\xe2\x86\x90",
        'unicodeCodePointEnd' => '21FF',
        'utf8End' => "\xe2\x87\xbf",
        'name' => 'Arrows',
    ],
    [
        'unicodeCodePointBegin' => '1D000',
        'utf8Begin' => "\xf0\x9d\x80\x80",
        'unicodeCodePointEnd' => '1D0FF',
        'utf8End' => "\xf0\x9d\x83\xbf",
        'name' => 'Byzantine Musical Symbols',
    ],
    [
        'unicodeCodePointBegin' => '2200',
        'utf8Begin' => "\xe2\x88\x80",
        'unicodeCodePointEnd' => '22FF',
        'utf8End' => "\xe2\x8b\xbf",
        'name' => 'Mathematical Operators',
    ],
    [
        'unicodeCodePointBegin' => '1D100',
        'utf8Begin' => "\xf0\x9d\x84\x80",
        'unicodeCodePointEnd' => '1D1FF',
        'utf8End' => "\xf0\x9d\x87\xbf",
        'name' => 'Musical Symbols',
    ],
    [
        'unicodeCodePointBegin' => '2300',
        'utf8Begin' => "\xe2\x8c\x80",
        'unicodeCodePointEnd' => '23FF',
        'utf8End' => "\xe2\x8f\xbf",
        'name' => 'Miscellaneous Technical',
    ],
    [
        'unicodeCodePointBegin' => '1D300',
        'utf8Begin' => "\xf0\x9d\x8c\x80",
        'unicodeCodePointEnd' => '1D35F',
        'utf8End' => "\xf0\x9d\x8d\x9f",
        'name' => 'Tai Xuan Jing Symbols',
    ],
    [
        'unicodeCodePointBegin' => '2400',
        'utf8Begin' => "\xe2\x90\x80",
        'unicodeCodePointEnd' => '243F',
        'utf8End' => "\xe2\x90\xbf",
        'name' => 'Control Pictures',
    ],
    [
        'unicodeCodePointBegin' => '1D400',
        'utf8Begin' => "\xf0\x9d\x90\x80",
        'unicodeCodePointEnd' => '1D7FF',
        'utf8End' => "\xf0\x9d\x9f\xbf",
        'name' => 'Mathematical Alphanumeric Symbols',
    ],
    [
        'unicodeCodePointBegin' => '2440',
        'utf8Begin' => "\xe2\x91\x80",
        'unicodeCodePointEnd' => '245F',
        'utf8End' => "\xe2\x91\x9f",
        'name' => 'Optical Character Recognition',
    ],
    [
        'unicodeCodePointBegin' => '20000',
        'utf8Begin' => "\xf0\xa0\x80\x80",
        'unicodeCodePointEnd' => '2A6DF',
        'utf8End' => "\xf0\xaa\x9b\x9f",
        'name' => 'CJK Unified Ideographs Extension B',
    ],
    [
        'unicodeCodePointBegin' => '2460',
        'utf8Begin' => "\xe2\x91\xa0",
        'unicodeCodePointEnd' => '24FF',
        'utf8End' => "\xe2\x93\xbf",
        'name' => 'Enclosed Alphanumerics',
    ],
    [
        'unicodeCodePointBegin' => '2F800',
        'utf8Begin' => "\xf0\xaf\xa0\x80",
        'unicodeCodePointEnd' => '2FA1F',
        'utf8End' => "\xf0\xaf\xa8\x9f",
        'name' => 'CJK Compatibility Ideographs Supplement',
    ],
    [
        'unicodeCodePointBegin' => '2500',
        'utf8Begin' => "\xe2\x94\x80",
        'unicodeCodePointEnd' => '257F',
        'utf8End' => "\xe2\x95\xbf",
        'name' => 'Box Drawing',
    ],
    [
        'unicodeCodePointBegin' => 'E0000',
        'utf8Begin' => "\xf3\xa0\x80\x80",
        'unicodeCodePointEnd' => 'E007F',
        'utf8End' => "\xf3\xa0\x81\xbf",
        'name' => 'Tags',
    ],
];
Sign up for free to join this conversation on GitHub. Already have an account? Sign in to comment