Unicode Property List

character | properties | unicode-set | compare-sets | help

Age [string]
® alnum False, True
Alphabetic False, True
ASCII_Hex_Digit False, True
Bidi_Class Arabic_Letter, Arabic_Number, Boundary_Neutral, Common_Separator, European_Number, European_Separator, European_Terminator, Left_To_Right, Left_To_Right_Embedding, Left_To_Right_Override, Nonspacing_Mark, Other_Neutral, Paragraph_Separator, Pop_Directional_Format, Right_To_Left, Right_To_Left_Embedding, Right_To_Left_Override, Segment_Separator, White_Space
Bidi_Control False, True
Bidi_Mirrored False, True
Bidi_Mirroring_Glyph [string]
® blank False, True
Block Aegean_Numbers, Alphabetic_Presentation_Forms, Ancient_Greek_Musical_Notation, Ancient_Greek_Numbers, Ancient_Symbols, Arabic, Arabic_Presentation_Forms_A, Arabic_Presentation_Forms_B, Arabic_Supplement, Armenian, Arrows, Balinese, Basic_Latin, Bengali, Block_Elements, Bopomofo, Bopomofo_Extended, Box_Drawing, Braille_Patterns, Buginese, Buhid, Byzantine_Musical_Symbols, Carian, Cham, Cherokee, CJK_Compatibility, CJK_Compatibility_Forms, CJK_Compatibility_Ideographs, CJK_Compatibility_Ideographs_Supplement, CJK_Radicals_Supplement, CJK_Strokes, CJK_Symbols_And_Punctuation, CJK_Unified_Ideographs, CJK_Unified_Ideographs_Extension_A, CJK_Unified_Ideographs_Extension_B, Combining_Diacritical_Marks, Combining_Diacritical_Marks_For_Symbols, Combining_Diacritical_Marks_Supplement, Combining_Half_Marks, Control_Pictures, Coptic, Counting_Rod_Numerals, Cuneiform, Cuneiform_Numbers_And_Punctuation, Currency_Symbols, Cypriot_Syllabary, Cyrillic, Cyrillic_Extended_A, Cyrillic_Extended_B, Cyrillic_Supplement, Deseret, Devanagari, Dingbats, Domino_Tiles, Enclosed_Alphanumerics, Enclosed_CJK_Letters_And_Months, Ethiopic, Ethiopic_Extended, Ethiopic_Supplement, General_Punctuation, Geometric_Shapes, Georgian, Georgian_Supplement, Glagolitic, Gothic, Greek_And_Coptic, Greek_Extended, Gujarati, Gurmukhi, Halfwidth_And_Fullwidth_Forms, Hangul_Compatibility_Jamo, Hangul_Jamo, Hangul_Syllables, Hanunoo, Hebrew, High_Private_Use_Surrogates, High_Surrogates, Hiragana, Ideographic_Description_Characters, IPA_Extensions, Kanbun, Kangxi_Radicals, Kannada, Katakana, Katakana_Phonetic_Extensions, Kayah_Li, Kharoshthi, Khmer, Khmer_Symbols, Lao, Latin_1_Supplement, Latin_Extended_A, Latin_Extended_Additional, Latin_Extended_B, Latin_Extended_C, Latin_Extended_D, Lepcha, Letterlike_Symbols, Limbu, Linear_B_Ideograms, Linear_B_Syllabary, Low_Surrogates, Lycian, Lydian, Mahjong_Tiles, Malayalam, Mathematical_Alphanumeric_Symbols, Mathematical_Operators, Miscellaneous_Mathematical_Symbols_A, Miscellaneous_Mathematical_Symbols_B, Miscellaneous_Symbols, Miscellaneous_Symbols_And_Arrows, Miscellaneous_Technical, Modifier_Tone_Letters, Mongolian, Musical_Symbols, Myanmar, New_Tai_Lue, NKo, No_Block, Number_Forms, Ogham, Ol_Chiki, Old_Italic, Old_Persian, Optical_Character_Recognition, Oriya, Osmanya, Phags_Pa, Phaistos_Disc, Phoenician, Phonetic_Extensions, Phonetic_Extensions_Supplement, Private_Use_Area, Rejang, Runic, Saurashtra, Shavian, Sinhala, Small_Form_Variants, Spacing_Modifier_Letters, Specials, Sundanese, Superscripts_And_Subscripts, Supplemental_Arrows_A, Supplemental_Arrows_B, Supplemental_Mathematical_Operators, Supplemental_Punctuation, Supplementary_Private_Use_Area_A, Supplementary_Private_Use_Area_B, Syloti_Nagri, Syriac, Tagalog, Tagbanwa, Tags, Tai_Le, Tai_Xuan_Jing_Symbols, Tamil, Telugu, Thaana, Thai, Tibetan, Tifinagh, Ugaritic, Unified_Canadian_Aboriginal_Syllabics, Vai, Variation_Selectors, Variation_Selectors_Supplement, Vertical_Forms, Yi_Radicals, Yi_Syllables, Yijing_Hexagram_Symbols
Canonical_Combining_Class 10, 11, 12, 13, 14, 15, 16, 17, 18, 19, 20, 21, 22, 23, 24, 25, 26, 27, 28, 29, 30, 31, 32, 33, 34, 35, 36, 84, 91, 103, 107, 118, 122, 129, 130, 132, 214, Above, Above_Left, Above_Right, Attached_Above_Right, Attached_Below, Attached_Below_Left, Below, Below_Left, Below_Right, Double_Above, Double_Below, Iota_Subscript, Kana_Voicing, Left, Not_Reordered, Nukta, Overlay, Right, Virama
Case_Folding [string]
© Case_Sensitive False, True
Dash False, True
Decomposition_Type Canonical, Circle, Compat, Final, font, Fraction, Initial, Isolated, Medial, Narrow, Nobreak, none, Small, Square, sub, Super, Vertical, wide
Default_Ignorable_Code_Point False, True
Deprecated False, True
Diacritic False, True
East_Asian_Width Ambiguous, Fullwidth, Halfwidth, Narrow, Neutral, Wide
Extender False, True
Full_Composition_Exclusion False, True
General_Category Close_Punctuation, Connector_Punctuation, Control, Currency_Symbol, Dash_Punctuation, Decimal_Number, Enclosing_Mark, Final_Punctuation, Format, Initial_Punctuation, Letter_Number, Line_Separator, Lowercase_Letter, Math_Symbol, Modifier_Letter, Modifier_Symbol, Nonspacing_Mark, Open_Punctuation, Other_Letter, Other_Number, Other_Punctuation, Other_Symbol, Paragraph_Separator, Private_Use, Space_Separator, Spacing_Mark, Surrogate, Titlecase_Letter, Unassigned, Uppercase_Letter
® graph False, True
Grapheme_Base False, True
Grapheme_Cluster_Break Control, CR, Extend, L, LF, LV, LVT, Other, Prepend, SpacingMark, T, V
Grapheme_Extend False, True
Grapheme_Link False, True
Hangul_Syllable_Type Leading_Jamo, LV_Syllable, LVT_Syllable, Not_Applicable, Trailing_Jamo, Vowel_Jamo
Hex_Digit False, True
Hyphen False, True
ID_Continue False, True
ID_Start False, True
Ideographic False, True
IDS_Binary_Operator False, True
IDS_Trinary_Operator False, True
ISO_Comment [string]
Join_Control False, True
Joining_Group Ain, Alaph, Alef, Beh, Beth, Burushaski_Yeh_Barree, Dal, Dalath_Rish, E, Fe, Feh, Final_Semkath, Gaf, Gamal, Hah, Hamza_On_Heh_Goal, He, Heh, Heh_Goal, Heth, Kaf, Kaph, Khaph, Knotted_Heh, Lam, Lamadh, Meem, Mim, No_Joining_Group, Noon, Nun, Pe, Qaf, Qaph, Reh, Reversed_Pe, Sad, Sadhe, Seen, Semkath, Shin, Swash_Kaf, Syriac_Waw, Tah, Taw, Teh_Marbuta, Teth, Waw, Yeh, Yeh_Barree, Yeh_With_Tail, Yudh, Yudh_He, Zain, Zhain
Joining_Type Dual_Joining, Join_Causing, Left_Joining, Non_Joining, Right_Joining, Transparent
© Lead_Canonical_Combining_Class Above, Above_Left, Above_Right, Attached_Above_Right, Attached_Below, Attached_Below_Left, Below, Below_Left, Below_Right, Double_Above, Double_Below, Iota_Subscript, Kana_Voicing, Left, Not_Reordered, Nukta, Overlay, Right, Virama
Line_Break Alphabetic, Ambiguous, Break_After, Break_Before, Break_Both, Break_Symbols, Carriage_Return, Close_Punctuation, Combining_Mark, Complex_Context, Contingent_Break, Exclamation, Glue, H2, H3, Hyphen, Ideographic, Infix_Numeric, Inseparable, JL, JT, JV, Line_Feed, Mandatory_Break, Next_Line, Nonstarter, Numeric, Open_Punctuation, Postfix_Numeric, Prefix_Numeric, Quotation, Space, Surrogate, Unknown, Word_Joiner, ZWSpace
Logical_Order_Exception False, True
Lowercase False, True
Lowercase_Mapping [string]
Math False, True
Name [string]
© NFC_Inert False, True
NFC_Quick_Check Maybe, No, Yes
© NFD_Inert False, True
NFD_Quick_Check No, Yes
© NFKC_Inert False, True
NFKC_Quick_Check Maybe, No, Yes
© NFKD_Inert False, True
NFKD_Quick_Check No, Yes
Noncharacter_Code_Point False, True
Numeric_Type Decimal, Digit, None, Numeric
Numeric_Value [double]
Pattern_Syntax False, True
Pattern_White_Space False, True
® print False, True
Quotation_Mark False, True
Radical False, True
Script Arabic, Armenian, Armi, Avst, Balinese, Batk, Bengali, Blis, Bopomofo, Brah, Braille, Buginese, Buhid, Cakm, Canadian_Aboriginal, Carian, Cham, Cherokee, Cirt, Common, Coptic, Cuneiform, Cypriot, Cyrillic, Cyrs, Deseret, Devanagari, Egyd, Egyh, Egyp, Ethiopic, Geok, Georgian, Glagolitic, Gothic, Greek, Gujarati, Gurmukhi, Han, Hangul, Hans, Hant, Hanunoo, Hebrew, Hiragana, Hmng, Hung, Inds, Inherited, Java, Jpan, Kannada, Katakana, Katakana_Or_Hiragana, Kayah_Li, Kharoshthi, Khmer, Kore, Kthi, Lana, Lao, Latf, Latg, Latin, Lepcha, Limbu, Lina, Linear_B, Lycian, Lydian, Malayalam, Mand, Mani, Maya, Mero, Mongolian, Moon, Mtei, Myanmar, New_Tai_Lue, Nko, Ogham, Ol_Chiki, Old_Italic, Old_Persian, Oriya, Orkh, Osmanya, Perm, Phags_Pa, Phli, Phlp, Phlv, Phoenician, Plrd, Prti, Rejang, Roro, Runic, Samr, Sara, Saurashtra, Sgnw, Shavian, Sinhala, Sundanese, Syloti_Nagri, Syre, Syriac, Syrj, Syrn, Tagalog, Tagbanwa, Tai_Le, Tamil, Tavt, Telugu, Teng, Thaana, Thai, Tibetan, Tifinagh, Ugaritic, Unknown, Vai, Visp, Yi, Zmth, Zsym, Zxxx
© Segment_Starter False, True
Sentence_Break ATerm, Close, CR, Extend, Format, LF, Lower, Numeric, OLetter, Other, SContinue, Sep, Sp, STerm, Upper
Simple_Case_Folding [string]
Simple_Lowercase_Mapping [string]
Simple_Titlecase_Mapping [string]
Simple_Uppercase_Mapping [string]
Soft_Dotted False, True
STerm False, True
Terminal_Punctuation False, True
Titlecase_Mapping [string]
© Trail_Canonical_Combining_Class Above, Above_Left, Above_Right, Attached_Above_Right, Attached_Below, Attached_Below_Left, Below, Below_Left, Below_Right, Double_Above, Double_Below, Iota_Subscript, Kana_Voicing, Left, Not_Reordered, Nukta, Overlay, Right, Virama
Unicode_1_Name [string]
Unified_Ideograph False, True
Uppercase False, True
Uppercase_Mapping [string]
Variation_Selector False, True
White_Space False, True
Word_Break ALetter, CR, Extend, ExtendNumLet, Format, Katakana, LF, MidLetter, MidNum, MidNumLet, Newline, Numeric, Other
® xdigit False, True
XID_Continue False, True
XID_Start False, True

® = Regex property (UTS #18); not a formal Unicode property
© = ICU-only property (neither a Unicode property nor a Regex property)
Not explicitly in ICU: [Composition_Exclusion, Decomposition_Mapping, Expands_On_NFC, Expands_On_NFD, Expands_On_NFKC, Expands_On_NFKD, FC_NFKC_Closure, Other_Alphabetic, Other_Default_Ignorable_Code_Point, Other_Grapheme_Extend, Other_ID_Continue, Other_ID_Start, Other_Lowercase, Other_Math, Other_Uppercase, Special_Case_Condition, Unicode_Radical_Stroke, word]

Built with ICU version: 4.1.1.0