The Unicode Range and Viewer

本文详细介绍了Unicode标准中定义的各种字符范围及其对应的字符集,包括基本拉丁字母、希腊字母、阿拉伯文、汉字等,并提供了每个范围的起始和结束代码点。

http://www.russellcottrell.com/greek/utilities/UnicodeRanges.htm

/*
 * One named range of Unicode code points.
 *
 * The table that uses this type stores the first and last code point of
 * each range (both end points belong to the range) and a printable name.
 */
typedef struct {
    uint32_t FristCode;    /* first code point of the range (spelling kept: part of the interface) */
    uint32_t LastCode;     /* last code point of the range */
    uint8_t *Description;  /* name of the range, NUL-terminated */
} UNICODE_RANGE_T;

/*
 * Table of Unicode blocks, listed in ascending code point order.
 *
 * Each entry is { first code point, last code point, block name }; both end
 * points belong to the block.  The table is not contiguous: code points that
 * fall between two entries are not covered by any entry.
 *
 * Block names with a hyphenated suffix are spelled the way the Unicode block
 * list spells them ("Latin-1 Supplement", "Latin Extended-A", ...).
 */
const UNICODE_RANGE_T UnicodeRange[ ] =
{
  { 0x0000, 0x007F, "Basic Latin" },
  { 0x0080, 0x00FF, "Latin-1 Supplement" },
  { 0x0100, 0x017F, "Latin Extended-A" },
  { 0x0180, 0x024F, "Latin Extended-B" },
  { 0x0250, 0x02AF, "IPA Extensions" },
  { 0x02B0, 0x02FF, "Spacing Modifier Letters" },
  { 0x0300, 0x036F, "Combining Diacritical Marks" },
  { 0x0370, 0x03FF, "Greek and Coptic" },
  { 0x0400, 0x04FF, "Cyrillic" },
  { 0x0500, 0x052F, "Cyrillic Supplementary" },
  { 0x0530, 0x058F, "Armenian" },
  { 0x0590, 0x05FF, "Hebrew" },
  { 0x0600, 0x06FF, "Arabic" },
  { 0x0700, 0x074F, "Syriac" },
  { 0x0780, 0x07BF, "Thaana" },
  { 0x0900, 0x097F, "Devanagari" },
  { 0x0980, 0x09FF, "Bengali" },
  { 0x0A00, 0x0A7F, "Gurmukhi" },
  { 0x0A80, 0x0AFF, "Gujarati" },
  { 0x0B00, 0x0B7F, "Oriya" },
  { 0x0B80, 0x0BFF, "Tamil" },
  { 0x0C00, 0x0C7F, "Telugu" },
  { 0x0C80, 0x0CFF, "Kannada" },
  { 0x0D00, 0x0D7F, "Malayalam" },
  { 0x0D80, 0x0DFF, "Sinhala" },
  { 0x0E00, 0x0E7F, "Thai" },
  { 0x0E80, 0x0EFF, "Lao" },
  { 0x0F00, 0x0FFF, "Tibetan" },
  { 0x1000, 0x109F, "Myanmar" },
  { 0x10A0, 0x10FF, "Georgian" },
  { 0x1100, 0x11FF, "Hangul Jamo" },
  { 0x1200, 0x137F, "Ethiopic" },
  { 0x13A0, 0x13FF, "Cherokee" },
  { 0x1400, 0x167F, "Unified Canadian Aboriginal Syllabics" },
  { 0x1680, 0x169F, "Ogham" },
  { 0x16A0, 0x16FF, "Runic" },
  { 0x1700, 0x171F, "Tagalog" },
  { 0x1720, 0x173F, "Hanunoo" },
  { 0x1740, 0x175F, "Buhid" },
  { 0x1760, 0x177F, "Tagbanwa" },
  { 0x1780, 0x17FF, "Khmer" },
  { 0x1800, 0x18AF, "Mongolian" },
  { 0x1900, 0x194F, "Limbu" },
  { 0x1950, 0x197F, "Tai Le" },
  { 0x19E0, 0x19FF, "Khmer Symbols" },
  { 0x1D00, 0x1D7F, "Phonetic Extensions" },
  { 0x1E00, 0x1EFF, "Latin Extended Additional" },
  { 0x1F00, 0x1FFF, "Greek Extended" },
  { 0x2000, 0x206F, "General Punctuation" },
  { 0x2070, 0x209F, "Superscripts and Subscripts" },
  { 0x20A0, 0x20CF, "Currency Symbols" },
  { 0x20D0, 0x20FF, "Combining Diacritical Marks for Symbols" },
  { 0x2100, 0x214F, "Letterlike Symbols" },
  { 0x2150, 0x218F, "Number Forms" },
  { 0x2190, 0x21FF, "Arrows" },
  { 0x2200, 0x22FF, "Mathematical Operators" },
  { 0x2300, 0x23FF, "Miscellaneous Technical" },
  { 0x2400, 0x243F, "Control Pictures" },
  { 0x2440, 0x245F, "Optical Character Recognition" },
  { 0x2460, 0x24FF, "Enclosed Alphanumerics" },
  { 0x2500, 0x257F, "Box Drawing" },
  { 0x2580, 0x259F, "Block Elements" },
  { 0x25A0, 0x25FF, "Geometric Shapes" },
  { 0x2600, 0x26FF, "Miscellaneous Symbols" },
  { 0x2700, 0x27BF, "Dingbats" },
  { 0x27C0, 0x27EF, "Miscellaneous Mathematical Symbols-A" },
  { 0x27F0, 0x27FF, "Supplemental Arrows-A" },
  { 0x2800, 0x28FF, "Braille Patterns" },
  { 0x2900, 0x297F, "Supplemental Arrows-B" },
  { 0x2980, 0x29FF, "Miscellaneous Mathematical Symbols-B" },
  { 0x2A00, 0x2AFF, "Supplemental Mathematical Operators" },
  { 0x2B00, 0x2BFF, "Miscellaneous Symbols and Arrows" },
  { 0x2E80, 0x2EFF, "CJK Radicals Supplement" },
  { 0x2F00, 0x2FDF, "Kangxi Radicals" },
  { 0x2FF0, 0x2FFF, "Ideographic Description Characters" },
  { 0x3000, 0x303F, "CJK Symbols and Punctuation" },
  { 0x3040, 0x309F, "Hiragana" },
  { 0x30A0, 0x30FF, "Katakana" },
  { 0x3100, 0x312F, "Bopomofo" },
  { 0x3130, 0x318F, "Hangul Compatibility Jamo" },
  { 0x3190, 0x319F, "Kanbun" },
  { 0x31A0, 0x31BF, "Bopomofo Extended" },
  { 0x31F0, 0x31FF, "Katakana Phonetic Extensions" },
  { 0x3200, 0x32FF, "Enclosed CJK Letters and Months" },
  { 0x3300, 0x33FF, "CJK Compatibility" },
  { 0x3400, 0x4DBF, "CJK Unified Ideographs Extension A" },
  { 0x4DC0, 0x4DFF, "Yijing Hexagram Symbols" },
  { 0x4E00, 0x9FFF, "CJK Unified Ideographs" },
  { 0xA000, 0xA48F, "Yi Syllables" },
  { 0xA490, 0xA4CF, "Yi Radicals" },
  { 0xAC00, 0xD7AF, "Hangul Syllables" },
  { 0xD800, 0xDB7F, "High Surrogates" },
  { 0xDB80, 0xDBFF, "High Private Use Surrogates" },
  { 0xDC00, 0xDFFF, "Low Surrogates" },
  { 0xE000, 0xF8FF, "Private Use Area" },
  { 0xF900, 0xFAFF, "CJK Compatibility Ideographs" },
  { 0xFB00, 0xFB4F, "Alphabetic Presentation Forms" },
  { 0xFB50, 0xFDFF, "Arabic Presentation Forms-A" },
  { 0xFE00, 0xFE0F, "Variation Selectors" },
  { 0xFE20, 0xFE2F, "Combining Half Marks" },
  { 0xFE30, 0xFE4F, "CJK Compatibility Forms" },
  { 0xFE50, 0xFE6F, "Small Form Variants" },
  { 0xFE70, 0xFEFF, "Arabic Presentation Forms-B" },
  { 0xFF00, 0xFFEF, "Halfwidth and Fullwidth Forms" },
  { 0xFFF0, 0xFFFF, "Specials" },
  { 0x10000, 0x1007F, "Linear B Syllabary" },
  { 0x10080, 0x100FF, "Linear B Ideograms" },
  { 0x10100, 0x1013F, "Aegean Numbers" },
  { 0x10300, 0x1032F, "Old Italic" },
  { 0x10330, 0x1034F, "Gothic" },
  { 0x10380, 0x1039F, "Ugaritic" },
  { 0x10400, 0x1044F, "Deseret" },
  { 0x10450, 0x1047F, "Shavian" },
  { 0x10480, 0x104AF, "Osmanya" },
  { 0x10800, 0x1083F, "Cypriot Syllabary" },
  { 0x1D000, 0x1D0FF, "Byzantine Musical Symbols" },
  { 0x1D100, 0x1D1FF, "Musical Symbols" },
  { 0x1D300, 0x1D35F, "Tai Xuan Jing Symbols" },
  { 0x1D400, 0x1D7FF, "Mathematical Alphanumeric Symbols" },
  { 0x20000, 0x2A6DF, "CJK Unified Ideographs Extension B" },
  { 0x2F800, 0x2FA1F, "CJK Compatibility Ideographs Supplement" },
  { 0xE0000, 0xE007F, "Tags" }
};
/*
 * One named range of Unicode code points, tagged with a bit index.
 *
 * Several ranges in the table that uses this type share the same BitIndex.
 * NOTE(review): the index values look like the bit numbers of the OpenType
 * OS/2 ulUnicodeRange fields - confirm against the consumer of this table.
 */
typedef struct {
    uint32_t BitIndex;     /* index of the bit this range is grouped under */
    uint32_t FristCode;    /* first code point of the range (spelling kept: part of the interface) */
    uint32_t LastCode;     /* last code point of the range */
    uint8_t *Description;  /* name of the range, NUL-terminated */
} UNICODE_RANGE_T;

/*
 * Table of Unicode ranges grouped by bit index.
 *
 * Each entry is { bit index, first code point, last code point, name }; both
 * end points belong to the range.  Several ranges may share one bit index.
 *
 * Entry order is kept exactly as published: the rows are ordered by the bit
 * index read as text (which is why the bit-4 rows sit between 39 and 40),
 * not by code point, so do not binary-search this table by code point.
 *
 * NOTE(review): the bit numbers appear to follow the OpenType OS/2
 * ulUnicodeRange assignment.  Bit 57 is listed here with the surrogate range
 * D800-DFFF; newer revisions of that specification may describe the bit
 * differently - confirm before relying on it.
 */
const UNICODE_RANGE_T UnicodeRange[ ] =
{
  {   0, 0x0000,   0x007F,   "BasicLatin" },
  {   1, 0x0080,   0x00FF,   "Latin-1Supplement" },
  {   2, 0x0100,   0x017F,   "LatinExtended-A" },
  {   3, 0x0180,   0x024F,   "LatinExtended-B" },
  {   4, 0x0250,   0x02AF,   "IPAExtensions" },
  {   5, 0x02B0,   0x02FF,   "SpacingModifierLetters" },
  {   5, 0xA700,   0xA71F,   "ModifierToneLetters" },
  {   6, 0x0300,   0x036F,   "CombiningDiacriticalMarks" },
  {   6, 0x1DC0,   0x1DFF,   "CombiningDiacriticalMarksSupplement" },
  {   7, 0x0370,   0x03FF,   "GreekandCoptic" },
  {   8, 0x2C80,   0x2CFF,   "Coptic" },
  {   9, 0x0400,   0x04FF,   "Cyrillic" },
  {   9, 0x0500,   0x052F,   "CyrillicSupplement" },
  {   9, 0x2DE0,   0x2DFF,   "CyrillicExtended-A" },
  {  10, 0x0530,   0x058F,   "Armenian" },
  /* Cyrillic Extended-B belongs with the other Cyrillic ranges (bit 9),
     not with Armenian (bit 10). */
  {   9, 0xA640,   0xA69F,   "CyrillicExtended-B" },
  {  11, 0x0590,   0x05FF,   "Hebrew" },
  {  12, 0xA500,   0xA63F,   "Vai" },
  {  13, 0x0600,   0x06FF,   "Arabic" },
  {  13, 0x0750,   0x077F,   "ArabicSupplement" },
  {  14, 0x07C0,   0x07FF,   "NKo" },
  {  15, 0x0900,   0x097F,   "Devanagari" },
  {  16, 0x0980,   0x09FF,   "Bengali" },
  {  17, 0x0A00,   0x0A7F,   "Gurmukhi" },
  {  18, 0x0A80,   0x0AFF,   "Gujarati" },
  {  19, 0x0B00,   0x0B7F,   "Oriya" },
  {  20, 0x0B80,   0x0BFF,   "Tamil" },
  {  21, 0x0C00,   0x0C7F,   "Telugu" },
  {  22, 0x0C80,   0x0CFF,   "Kannada" },
  {  23, 0x0D00,   0x0D7F,   "Malayalam" },
  {  24, 0x0E00,   0x0E7F,   "Thai" },
  {  25, 0x0E80,   0x0EFF,   "Lao" },
  {  26, 0x10A0,   0x10FF,   "Georgian" },
  {  26, 0x2D00,   0x2D2F,   "GeorgianSupplement" },
  {  27, 0x1B00,   0x1B7F,   "Balinese" },
  {  28, 0x1100,   0x11FF,   "HangulJamo" },
  {  29, 0x1E00,   0x1EFF,   "LatinExtendedAdditional" },
  {  29, 0x2C60,   0x2C7F,   "LatinExtended-C" },
  {  29, 0xA720,   0xA7FF,   "LatinExtended-D" },
  {  30, 0x1F00,   0x1FFF,   "GreekExtended" },
  {  31, 0x2000,   0x206F,   "GeneralPunctuation" },
  {  31, 0x2E00,   0x2E7F,   "SupplementalPunctuation" },
  {  32, 0x2070,   0x209F,   "SuperscriptsAndSubscripts" },
  {  33, 0x20A0,   0x20CF,   "CurrencySymbols" },
  {  34, 0x20D0,   0x20FF,   "CombiningDiacriticalMarksForSymbols" },
  {  35, 0x2100,   0x214F,   "LetterlikeSymbols" },
  {  36, 0x2150,   0x218F,   "NumberForms" },
  {  37, 0x2190,   0x21FF,   "Arrows" },
  {  37, 0x27F0,   0x27FF,   "SupplementalArrows-A" },
  {  37, 0x2900,   0x297F,   "SupplementalArrows-B" },
  {  37, 0x2B00,   0x2BFF,   "MiscellaneousSymbolsandArrows" },
  {  38, 0x2200,   0x22FF,   "MathematicalOperators" },
  {  38, 0x27C0,   0x27EF,   "MiscellaneousMathematicalSymbols-A" },
  {  38, 0x2980,   0x29FF,   "MiscellaneousMathematicalSymbols-B" },
  {  38, 0x2A00,   0x2AFF,   "SupplementalMathematicalOperators" },
  {  39, 0x2300,   0x23FF,   "MiscellaneousTechnical" },
  {   4, 0x1D00,   0x1D7F,   "PhoneticExtensions" },
  {   4, 0x1D80,   0x1DBF,   "PhoneticExtensionsSupplement" },
  {  40, 0x2400,   0x243F,   "ControlPictures" },
  {  41, 0x2440,   0x245F,   "OpticalCharacterRecognition" },
  {  42, 0x2460,   0x24FF,   "EnclosedAlphanumerics" },
  {  43, 0x2500,   0x257F,   "BoxDrawing" },
  {  44, 0x2580,   0x259F,   "BlockElements" },
  {  45, 0x25A0,   0x25FF,   "GeometricShapes" },
  {  46, 0x2600,   0x26FF,   "MiscellaneousSymbols" },
  {  47, 0x2700,   0x27BF,   "Dingbats" },
  {  48, 0x3000,   0x303F,   "CJKSymbolsAndPunctuation" },
  {  49, 0x3040,   0x309F,   "Hiragana" },
  {  50, 0x30A0,   0x30FF,   "Katakana" },
  {  50, 0x31F0,   0x31FF,   "KatakanaPhoneticExtensions" },
  {  51, 0x3100,   0x312F,   "Bopomofo" },
  {  51, 0x31A0,   0x31BF,   "BopomofoExtended" },
  {  52, 0x3130,   0x318F,   "HangulCompatibilityJamo" },
  {  53, 0xA840,   0xA87F,   "Phags-pa" },
  {  54, 0x3200,   0x32FF,   "EnclosedCJKLettersAndMonths" },
  {  55, 0x3300,   0x33FF,   "CJKCompatibility" },
  {  56, 0xAC00,   0xD7AF,   "HangulSyllables" },
  {  57, 0xD800,   0xDFFF,   "Non-Plane0." },
  {  58, 0x10900,  0x1091F,  "Phoenician" },
  {  59, 0x20000,  0x2A6DF,  "CJKUnifiedIdeographsExtensionB" },
  {  59, 0x2E80,   0x2EFF,   "CJKRadicalsSupplement" },
  {  59, 0x2F00,   0x2FDF,   "KangxiRadicals" },
  {  59, 0x2FF0,   0x2FFF,   "IdeographicDescriptionCharacters" },
  {  59, 0x3190,   0x319F,   "Kanbun" },
  {  59, 0x3400,   0x4DBF,   "CJKUnifiedIdeographsExtensionA" },
  {  59, 0x4E00,   0x9FFF,   "CJKUnifiedIdeographs" },
  {  60, 0xE000,   0xF8FF,   "PrivateUseArea" },
  {  61, 0x2F800,  0x2FA1F,  "CJKCompatibilityIdeographsSupplement" },
  {  61, 0x31C0,   0x31EF,   "CJKStrokes" },
  {  61, 0xF900,   0xFAFF,   "CJKCompatibilityIdeographs" },
  {  62, 0xFB00,   0xFB4F,   "AlphabeticPresentationForms" },
  {  63, 0xFB50,   0xFDFF,   "ArabicPresentationForms-A" },
  {  64, 0xFE20,   0xFE2F,   "CombiningHalfMarks" },
  {  65, 0xFE10,   0xFE1F,   "VerticalForms" },
  {  65, 0xFE30,   0xFE4F,   "CJKCompatibilityForms" },
  {  66, 0xFE50,   0xFE6F,   "SmallFormVariants" },
  {  67, 0xFE70,   0xFEFF,   "ArabicPresentationForms-B" },
  {  68, 0xFF00,   0xFFEF,   "HalfwidthAndFullwidthForms" },
  {  69, 0xFFF0,   0xFFFF,   "Specials" },
  {  70, 0x0F00,   0x0FFF,   "Tibetan" },
  {  71, 0x0700,   0x074F,   "Syriac" },
  {  72, 0x0780,   0x07BF,   "Thaana" },
  {  73, 0x0D80,   0x0DFF,   "Sinhala" },
  {  74, 0x1000,   0x109F,   "Myanmar" },
  {  75, 0x1200,   0x137F,   "Ethiopic" },
  {  75, 0x1380,   0x139F,   "EthiopicSupplement" },
  {  75, 0x2D80,   0x2DDF,   "EthiopicExtended" },
  {  76, 0x13A0,   0x13FF,   "Cherokee" },
  {  77, 0x1400,   0x167F,   "UnifiedCanadianAboriginalSyllabics" },
  {  78, 0x1680,   0x169F,   "Ogham" },
  {  79, 0x16A0,   0x16FF,   "Runic" },
  {  80, 0x1780,   0x17FF,   "Khmer" },
  {  80, 0x19E0,   0x19FF,   "KhmerSymbols" },
  {  81, 0x1800,   0x18AF,   "Mongolian" },
  {  82, 0x2800,   0x28FF,   "BraillePatterns" },
  {  83, 0xA000,   0xA48F,   "YiSyllables" },
  {  83, 0xA490,   0xA4CF,   "YiRadicals" },
  {  84, 0x1700,   0x171F,   "Tagalog" },
  {  84, 0x1720,   0x173F,   "Hanunoo" },
  {  84, 0x1740,   0x175F,   "Buhid" },
  {  84, 0x1760,   0x177F,   "Tagbanwa" },
  {  85, 0x10300,  0x1032F,  "OldItalic" },
  {  86, 0x10330,  0x1034F,  "Gothic" },
  {  87, 0x10400,  0x1044F,  "Deseret" },
  {  88, 0x1D000,  0x1D0FF,  "ByzantineMusicalSymbols" },
  {  88, 0x1D100,  0x1D1FF,  "MusicalSymbols" },
  {  88, 0x1D200,  0x1D24F,  "AncientGreekMusicalNotation" },
  {  89, 0x1D400,  0x1D7FF,  "MathematicalAlphanumericSymbols" },
  {  90, 0x100000, 0x10FFFD, "PrivateUse(plane16)" },
  /* Plane 15 starts at U+F0000 (the source had 0xFF000, which would skip
     most of the plane). */
  {  90, 0xF0000,  0xFFFFD,  "PrivateUse(plane15)" },
  {  91, 0xE0100,  0xE01EF,  "VariationSelectorsSupplement" },
  {  91, 0xFE00,   0xFE0F,   "VariationSelectors" },
  {  92, 0xE0000,  0xE007F,  "Tags" },
  {  93, 0x1900,   0x194F,   "Limbu" },
  {  94, 0x1950,   0x197F,   "TaiLe" },
  {  95, 0x1980,   0x19DF,   "NewTaiLue" },
  {  96, 0x1A00,   0x1A1F,   "Buginese" },
  {  97, 0x2C00,   0x2C5F,   "Glagolitic" },
  {  98, 0x2D30,   0x2D7F,   "Tifinagh" },
  {  99, 0x4DC0,   0x4DFF,   "YijingHexagramSymbols" },
  { 100, 0xA800,   0xA82F,   "SylotiNagri" },
  { 101, 0x10000,  0x1007F,  "LinearBSyllabary" },
  { 101, 0x10080,  0x100FF,  "LinearBIdeograms" },
  { 101, 0x10100,  0x1013F,  "AegeanNumbers" },
  { 102, 0x10140,  0x1018F,  "AncientGreekNumbers" },
  { 103, 0x10380,  0x1039F,  "Ugaritic" },
  { 104, 0x103A0,  0x103DF,  "OldPersian" },
  { 105, 0x10450,  0x1047F,  "Shavian" },
  { 106, 0x10480,  0x104AF,  "Osmanya" },
  { 107, 0x10800,  0x1083F,  "CypriotSyllabary" },
  { 108, 0x10A00,  0x10A5F,  "Kharoshthi" },
  { 109, 0x1D300,  0x1D35F,  "TaiXuanJingSymbols" },
  { 110, 0x12000,  0x123FF,  "Cuneiform" },
  { 110, 0x12400,  0x1247F,  "CuneiformNumbersandPunctuation" },
  { 111, 0x1D360,  0x1D37F,  "CountingRodNumerals" },
  { 112, 0x1B80,   0x1BBF,   "Sundanese" },
  { 113, 0x1C00,   0x1C4F,   "Lepcha" },
  { 114, 0x1C50,   0x1C7F,   "OlChiki" },
  { 115, 0xA880,   0xA8DF,   "Saurashtra" },
  { 116, 0xA900,   0xA92F,   "KayahLi" },
  { 117, 0xA930,   0xA95F,   "Rejang" },
  { 118, 0xAA00,   0xAA5F,   "Cham" },
  { 119, 0x10190,  0x101CF,  "AncientSymbols" },
  { 120, 0x101D0,  0x101FF,  "PhaistosDisc" },
  { 121, 0x10280,  0x1029F,  "Lycian" },
  { 121, 0x102A0,  0x102DF,  "Carian" },
  { 121, 0x10920,  0x1093F,  "Lydian" },
  { 122, 0x1F000,  0x1F02F,  "MahjongTiles" },
  { 122, 0x1F030,  0x1F09F,  "DominoTiles" },
};

 

  

Unicode Character Ranges

In the following chart, the name of the range links to
the appropriate section of the Unicode standard on the Unicode web site.
These are PDF files. The beginning of the range is a link to an HTML chart.

0000 — 007F  Basic Latin
0080 — 00FF  C1 Controls and Latin-1 Supplement
0100 — 017F  Latin Extended-A
0180 — 024F  Latin Extended-B
0250 — 02AF  IPA Extensions
02B0 — 02FF  Spacing Modifier Letters
0300 — 036F  Combining Diacritical Marks
0370 — 03FF  Greek/Coptic
0400 — 04FF  Cyrillic
0500 — 052F  Cyrillic Supplement
0530 — 058F  Armenian
0590 — 05FF  Hebrew
0600 — 06FF  Arabic
0700 — 074F  Syriac
0750 — 077F  Undefined
0780 — 07BF  Thaana
07C0 — 08FF  Undefined
0900 — 097F  Devanagari
0980 — 09FF  Bengali/Assamese
0A00 — 0A7F  Gurmukhi
0A80 — 0AFF  Gujarati
0B00 — 0B7F  Oriya
0B80 — 0BFF  Tamil
0C00 — 0C7F  Telugu
0C80 — 0CFF  Kannada
0D00 — 0D7F  Malayalam
0D80 — 0DFF  Sinhala
0E00 — 0E7F  Thai
0E80 — 0EFF  Lao
0F00 — 0FFF  Tibetan
1000 — 109F  Myanmar
10A0 — 10FF  Georgian
1100 — 11FF  Hangul Jamo
1200 — 137F  Ethiopic
1380 — 139F  Undefined
13A0 — 13FF  Cherokee
1400 — 167F  Unified Canadian Aboriginal Syllabics
1680 — 169F  Ogham
16A0 — 16FF  Runic
1700 — 171F  Tagalog
1720 — 173F  Hanunoo
1740 — 175F  Buhid
1760 — 177F  Tagbanwa
1780 — 17FF  Khmer
1800 — 18AF  Mongolian
18B0 — 18FF  Undefined
1900 — 194F  Limbu
1950 — 197F  Tai Le
1980 — 19DF  Undefined
19E0 — 19FF  Khmer Symbols
1A00 — 1CFF  Undefined
1D00 — 1D7F  Phonetic Extensions
1D80 — 1DFF  Undefined
1E00 — 1EFF  Latin Extended Additional
1F00 — 1FFF  Greek Extended
2000 — 206F  General Punctuation
2070 — 209F  Superscripts and Subscripts
20A0 — 20CF  Currency Symbols
20D0 — 20FF  Combining Diacritical Marks for Symbols
2100 — 214F  Letterlike Symbols
2150 — 218F  Number Forms
2190 — 21FF  Arrows
2200 — 22FF  Mathematical Operators
2300 — 23FF  Miscellaneous Technical
2400 — 243F  Control Pictures
2440 — 245F  Optical Character Recognition
2460 — 24FF  Enclosed Alphanumerics
2500 — 257F  Box Drawing
2580 — 259F  Block Elements
25A0 — 25FF  Geometric Shapes
2600 — 26FF  Miscellaneous Symbols
2700 — 27BF  Dingbats
27C0 — 27EF  Miscellaneous Mathematical Symbols-A
27F0 — 27FF  Supplemental Arrows-A
2800 — 28FF  Braille Patterns
2900 — 297F  Supplemental Arrows-B
2980 — 29FF  Miscellaneous Mathematical Symbols-B
2A00 — 2AFF  Supplemental Mathematical Operators
2B00 — 2BFF  Miscellaneous Symbols and Arrows
2C00 — 2E7F  Undefined
2E80 — 2EFF  CJK Radicals Supplement
2F00 — 2FDF  Kangxi Radicals
2FE0 — 2FEF  Undefined
2FF0 — 2FFF  Ideographic Description Characters
3000 — 303F  CJK Symbols and Punctuation
3040 — 309F  Hiragana
30A0 — 30FF  Katakana
3100 — 312F  Bopomofo
3130 — 318F  Hangul Compatibility Jamo
3190 — 319F  Kanbun (Kunten)
31A0 — 31BF  Bopomofo Extended
31C0 — 31EF  Undefined
31F0 — 31FF  Katakana Phonetic Extensions
3200 — 32FF  Enclosed CJK Letters and Months
3300 — 33FF  CJK Compatibility
3400 — 4DBF  CJK Unified Ideographs Extension A
4DC0 — 4DFF  Yijing Hexagram Symbols
4E00 — 9FAF  CJK Unified Ideographs
9FB0 — 9FFF  Undefined
A000 — A48F  Yi Syllables
A490 — A4CF  Yi Radicals
A4D0 — ABFF  Undefined
AC00 — D7AF  Hangul Syllables
D7B0 — D7FF  Undefined
D800 — DBFF  High Surrogate Area
DC00 — DFFF  Low Surrogate Area
E000 — F8FF  Private Use Area
F900 — FAFF  CJK Compatibility Ideographs
FB00 — FB4F  Alphabetic Presentation Forms
FB50 — FDFF  Arabic Presentation Forms-A
FE00 — FE0F  Variation Selectors
FE10 — FE1F  Undefined
FE20 — FE2F  Combining Half Marks
FE30 — FE4F  CJK Compatibility Forms
FE50 — FE6F  Small Form Variants
FE70 — FEFF  Arabic Presentation Forms-B
FF00 — FFEF  Halfwidth and Fullwidth Forms
FFF0 — FFFF  Specials
10000 — 1007F  Linear B Syllabary
10080 — 100FF  Linear B Ideograms
10100 — 1013F  Aegean Numbers
10140 — 102FF  Undefined
10300 — 1032F  Old Italic
10330 — 1034F  Gothic
10380 — 1039F  Ugaritic
10400 — 1044F  Deseret
10450 — 1047F  Shavian
10480 — 104AF  Osmanya
104B0 — 107FF  Undefined
10800 — 1083F  Cypriot Syllabary
10840 — 1CFFF  Undefined
1D000 — 1D0FF  Byzantine Musical Symbols
1D100 — 1D1FF  Musical Symbols
1D200 — 1D2FF  Undefined
1D300 — 1D35F  Tai Xuan Jing Symbols
1D360 — 1D3FF  Undefined
1D400 — 1D7FF  Mathematical Alphanumeric Symbols
1D800 — 1FFFF  Undefined
20000 — 2A6DF  CJK Unified Ideographs Extension B
2A6E0 — 2F7FF  Undefined
2F800 — 2FA1F  CJK Compatibility Ideographs Supplement
2FAB0 — DFFFF  Unused
E0000 — E007F  Tags
E0080 — E00FF  Unused
E0100 — E01EF  Variation Selectors Supplement
E01F0 — EFFFF  Unused
F0000 — FFFFD  Supplementary Private Use Area-A
FFFFE — FFFFF  Unused
100000 — 10FFFD  Supplementary Private Use Area-B

Unicode Character Ranges

0020 — 007F  Basic Latin 2580 — 259F  Block Elements
00A0 — 00FF  Latin-1 Supplement 25A0 — 25FF  Geometric Shapes
0100 — 017F  Latin Extended-A 2600 — 26FF  Miscellaneous Symbols
0180 — 024F  Latin Extended-B 2700 — 27BF  Dingbats
0250 — 02AF  IPA Extensions 27C0 — 27EF  Miscellaneous Mathematical Symbols-A
02B0 — 02FF  Spacing Modifier Letters 27F0 — 27FF  Supplemental Arrows-A
0300 — 036F  Combining Diacritical Marks 2800 — 28FF  Braille Patterns
0370 — 03FF  Greek and Coptic 2900 — 297F  Supplemental Arrows-B
0400 — 04FF  Cyrillic 2980 — 29FF  Miscellaneous Mathematical Symbols-B
0500 — 052F  Cyrillic Supplementary 2A00 — 2AFF  Supplemental Mathematical Operators
0530 — 058F  Armenian 2B00 — 2BFF  Miscellaneous Symbols and Arrows
0590 — 05FF  Hebrew 2E80 — 2EFF  CJK Radicals Supplement
0600 — 06FF  Arabic 2F00 — 2FDF  Kangxi Radicals
0700 — 074F  Syriac 2FF0 — 2FFF  Ideographic Description Characters
0780 — 07BF  Thaana 3000 — 303F  CJK Symbols and Punctuation
0900 — 097F  Devanagari 3040 — 309F  Hiragana
0980 — 09FF  Bengali 30A0 — 30FF  Katakana
0A00 — 0A7F  Gurmukhi 3100 — 312F  Bopomofo
0A80 — 0AFF  Gujarati 3130 — 318F  Hangul Compatibility Jamo
0B00 — 0B7F  Oriya 3190 — 319F  Kanbun
0B80 — 0BFF  Tamil 31A0 — 31BF  Bopomofo Extended
0C00 — 0C7F  Telugu 31F0 — 31FF  Katakana Phonetic Extensions
0C80 — 0CFF  Kannada 3200 — 32FF  Enclosed CJK Letters and Months
0D00 — 0D7F  Malayalam 3300 — 33FF  CJK Compatibility
0D80 — 0DFF  Sinhala 3400 — 4DBF  CJK Unified Ideographs Extension A
0E00 — 0E7F  Thai 4DC0 — 4DFF  Yijing Hexagram Symbols
0E80 — 0EFF  Lao 4E00 — 9FFF  CJK Unified Ideographs
0F00 — 0FFF  Tibetan A000 — A48F  Yi Syllables
1000 — 109F  Myanmar A490 — A4CF  Yi Radicals
10A0 — 10FF  Georgian AC00 — D7AF  Hangul Syllables
1100 — 11FF  Hangul Jamo D800 — DB7F  High Surrogates
1200 — 137F  Ethiopic DB80 — DBFF  High Private Use Surrogates
13A0 — 13FF  Cherokee DC00 — DFFF  Low Surrogates
1400 — 167F  Unified Canadian Aboriginal Syllabics E000 — F8FF  Private Use Area
1680 — 169F  Ogham F900 — FAFF  CJK Compatibility Ideographs
16A0 — 16FF  Runic FB00 — FB4F  Alphabetic Presentation Forms
1700 — 171F  Tagalog FB50 — FDFF  Arabic Presentation Forms-A
1720 — 173F  Hanunoo FE00 — FE0F  Variation Selectors
1740 — 175F  Buhid FE20 — FE2F  Combining Half Marks
1760 — 177F  Tagbanwa FE30 — FE4F  CJK Compatibility Forms
1780 — 17FF  Khmer FE50 — FE6F  Small Form Variants
1800 — 18AF  Mongolian FE70 — FEFF  Arabic Presentation Forms-B
1900 — 194F  Limbu FF00 — FFEF  Halfwidth and Fullwidth Forms
1950 — 197F  Tai Le FFF0 — FFFF  Specials
19E0 — 19FF  Khmer Symbols 10000 — 1007F  Linear B Syllabary
1D00 — 1D7F  Phonetic Extensions 10080 — 100FF  Linear B Ideograms
1E00 — 1EFF  Latin Extended Additional 10100 — 1013F  Aegean Numbers
1F00 — 1FFF  Greek Extended 10300 — 1032F  Old Italic
2000 — 206F  General Punctuation 10330 — 1034F  Gothic
2070 — 209F  Superscripts and Subscripts 10380 — 1039F  Ugaritic
20A0 — 20CF  Currency Symbols 10400 — 1044F  Deseret
20D0 — 20FF  Combining Diacritical Marks for Symbols 10450 — 1047F  Shavian
2100 — 214F  Letterlike Symbols 10480 — 104AF  Osmanya
2150 — 218F  Number Forms 10800 — 1083F  Cypriot Syllabary
2190 — 21FF  Arrows 1D000 — 1D0FF  Byzantine Musical Symbols
2200 — 22FF  Mathematical Operators 1D100 — 1D1FF  Musical Symbols
2300 — 23FF  Miscellaneous Technical 1D300 — 1D35F  Tai Xuan Jing Symbols
2400 — 243F  Control Pictures 1D400 — 1D7FF  Mathematical Alphanumeric Symbols
2440 — 245F  Optical Character Recognition 20000 — 2A6DF  CJK Unified Ideographs Extension B
2460 — 24FF  Enclosed Alphanumerics 2F800 — 2FA1F  CJK Compatibility Ideographs Supplement
2500 — 257F  Box Drawing E0000 — E007F  Tags

 

 

转载于:https://www.cnblogs.com/shangdawei/archive/2013/05/12/3074438.html

评论
添加红包

请填写红包祝福语或标题

红包个数最小为10个

红包金额最低5元

当前余额3.43前往充值 >
需支付:10.00
成就一亿技术人!
领取后你会自动成为博主和红包主的粉丝 规则
hope_wisdom
发出的红包
实付
使用余额支付
点击重新获取
扫码支付
钱包余额 0

抵扣说明:

1.余额是钱包充值的虚拟货币,按照1:1的比例进行支付金额的抵扣。
2.余额无法直接购买下载,可以购买VIP、付费专栏及课程。

余额充值