| /************************************************* |
| * Unicode Property Table handler * |
| *************************************************/ |
| |
| #ifndef _UCP_H |
| #define _UCP_H |
| |
| /* This file contains definitions of the property values that are returned by |
| the function _pcre_ucp_findprop(). New values that are added for new releases |
| of Unicode should always be at the end of each enum, for backwards |
| compatibility. */ |
| |
| /* These are the general character categories. */ |
| |
| enum { |
| ucp_C, /* Other */ |
| ucp_L, /* Letter */ |
| ucp_M, /* Mark */ |
| ucp_N, /* Number */ |
| ucp_P, /* Punctuation */ |
| ucp_S, /* Symbol */ |
| ucp_Z /* Separator */ |
| }; |
| |
| /* These are the particular character types. */ |
| |
| enum { |
| ucp_Cc, /* Control */ |
| ucp_Cf, /* Format */ |
| ucp_Cn, /* Unassigned */ |
| ucp_Co, /* Private use */ |
| ucp_Cs, /* Surrogate */ |
| ucp_Ll, /* Lower case letter */ |
| ucp_Lm, /* Modifier letter */ |
| ucp_Lo, /* Other letter */ |
| ucp_Lt, /* Title case letter */ |
| ucp_Lu, /* Upper case letter */ |
| ucp_Mc, /* Spacing mark */ |
| ucp_Me, /* Enclosing mark */ |
| ucp_Mn, /* Non-spacing mark */ |
| ucp_Nd, /* Decimal number */ |
| ucp_Nl, /* Letter number */ |
| ucp_No, /* Other number */ |
| ucp_Pc, /* Connector punctuation */ |
| ucp_Pd, /* Dash punctuation */ |
| ucp_Pe, /* Close punctuation */ |
| ucp_Pf, /* Final punctuation */ |
| ucp_Pi, /* Initial punctuation */ |
| ucp_Po, /* Other punctuation */ |
| ucp_Ps, /* Open punctuation */ |
| ucp_Sc, /* Currency symbol */ |
| ucp_Sk, /* Modifier symbol */ |
| ucp_Sm, /* Mathematical symbol */ |
| ucp_So, /* Other symbol */ |
| ucp_Zl, /* Line separator */ |
| ucp_Zp, /* Paragraph separator */ |
| ucp_Zs /* Space separator */ |
| }; |
| |
| /* These are the script identifications. */ |
| |
| enum { |
| ucp_Arabic = G_UNICODE_SCRIPT_ARABIC, |
| ucp_Armenian = G_UNICODE_SCRIPT_ARMENIAN, |
| ucp_Bengali = G_UNICODE_SCRIPT_BENGALI, |
| ucp_Bopomofo = G_UNICODE_SCRIPT_BOPOMOFO, |
| ucp_Braille = G_UNICODE_SCRIPT_BRAILLE, |
| ucp_Buginese = G_UNICODE_SCRIPT_BUGINESE, |
| ucp_Buhid = G_UNICODE_SCRIPT_BUHID, |
| ucp_Canadian_Aboriginal = G_UNICODE_SCRIPT_CANADIAN_ABORIGINAL, |
| ucp_Cherokee = G_UNICODE_SCRIPT_CHEROKEE, |
| ucp_Common = G_UNICODE_SCRIPT_COMMON, |
| ucp_Coptic = G_UNICODE_SCRIPT_COPTIC, |
| ucp_Cypriot = G_UNICODE_SCRIPT_CYPRIOT, |
| ucp_Cyrillic = G_UNICODE_SCRIPT_CYRILLIC, |
| ucp_Deseret = G_UNICODE_SCRIPT_DESERET, |
| ucp_Devanagari = G_UNICODE_SCRIPT_DEVANAGARI, |
| ucp_Ethiopic = G_UNICODE_SCRIPT_ETHIOPIC, |
| ucp_Georgian = G_UNICODE_SCRIPT_GEORGIAN, |
| ucp_Glagolitic = G_UNICODE_SCRIPT_GLAGOLITIC, |
| ucp_Gothic = G_UNICODE_SCRIPT_GOTHIC, |
| ucp_Greek = G_UNICODE_SCRIPT_GREEK, |
| ucp_Gujarati = G_UNICODE_SCRIPT_GUJARATI, |
| ucp_Gurmukhi = G_UNICODE_SCRIPT_GURMUKHI, |
| ucp_Han = G_UNICODE_SCRIPT_HAN, |
| ucp_Hangul = G_UNICODE_SCRIPT_HANGUL, |
| ucp_Hanunoo = G_UNICODE_SCRIPT_HANUNOO, |
| ucp_Hebrew = G_UNICODE_SCRIPT_HEBREW, |
| ucp_Hiragana = G_UNICODE_SCRIPT_HIRAGANA, |
| ucp_Inherited = G_UNICODE_SCRIPT_INHERITED, |
| ucp_Kannada = G_UNICODE_SCRIPT_KANNADA, |
| ucp_Katakana = G_UNICODE_SCRIPT_KATAKANA, |
| ucp_Kharoshthi = G_UNICODE_SCRIPT_KHAROSHTHI, |
| ucp_Khmer = G_UNICODE_SCRIPT_KHMER, |
| ucp_Lao = G_UNICODE_SCRIPT_LAO, |
| ucp_Latin = G_UNICODE_SCRIPT_LATIN, |
| ucp_Limbu = G_UNICODE_SCRIPT_LIMBU, |
| ucp_Linear_B = G_UNICODE_SCRIPT_LINEAR_B, |
| ucp_Malayalam = G_UNICODE_SCRIPT_MALAYALAM, |
| ucp_Mongolian = G_UNICODE_SCRIPT_MONGOLIAN, |
| ucp_Myanmar = G_UNICODE_SCRIPT_MYANMAR, |
| ucp_New_Tai_Lue = G_UNICODE_SCRIPT_NEW_TAI_LUE, |
| ucp_Ogham = G_UNICODE_SCRIPT_OGHAM, |
| ucp_Old_Italic = G_UNICODE_SCRIPT_OLD_ITALIC, |
| ucp_Old_Persian = G_UNICODE_SCRIPT_OLD_PERSIAN, |
| ucp_Oriya = G_UNICODE_SCRIPT_ORIYA, |
| ucp_Osmanya = G_UNICODE_SCRIPT_OSMANYA, |
| ucp_Runic = G_UNICODE_SCRIPT_RUNIC, |
| ucp_Shavian = G_UNICODE_SCRIPT_SHAVIAN, |
| ucp_Sinhala = G_UNICODE_SCRIPT_SINHALA, |
| ucp_Syloti_Nagri = G_UNICODE_SCRIPT_SYLOTI_NAGRI, |
| ucp_Syriac = G_UNICODE_SCRIPT_SYRIAC, |
| ucp_Tagalog = G_UNICODE_SCRIPT_TAGALOG, |
| ucp_Tagbanwa = G_UNICODE_SCRIPT_TAGBANWA, |
| ucp_Tai_Le = G_UNICODE_SCRIPT_TAI_LE, |
| ucp_Tamil = G_UNICODE_SCRIPT_TAMIL, |
| ucp_Telugu = G_UNICODE_SCRIPT_TELUGU, |
| ucp_Thaana = G_UNICODE_SCRIPT_THAANA, |
| ucp_Thai = G_UNICODE_SCRIPT_THAI, |
| ucp_Tibetan = G_UNICODE_SCRIPT_TIBETAN, |
| ucp_Tifinagh = G_UNICODE_SCRIPT_TIFINAGH, |
| ucp_Ugaritic = G_UNICODE_SCRIPT_UGARITIC, |
| ucp_Yi = G_UNICODE_SCRIPT_YI, |
| ucp_Balinese = G_UNICODE_SCRIPT_BALINESE, /* New for Unicode 5.0.0 */ |
| ucp_Cuneiform = G_UNICODE_SCRIPT_CUNEIFORM, /* New for Unicode 5.0.0 */ |
| ucp_Nko = G_UNICODE_SCRIPT_NKO, /* New for Unicode 5.0.0 */ |
| ucp_Phags_Pa = G_UNICODE_SCRIPT_PHAGS_PA, /* New for Unicode 5.0.0 */ |
| ucp_Phoenician = G_UNICODE_SCRIPT_PHOENICIAN, /* New for Unicode 5.0.0 */ |
| ucp_Carian = G_UNICODE_SCRIPT_CARIAN, /* New for Unicode 5.1 */ |
| ucp_Cham = G_UNICODE_SCRIPT_CHAM, /* New for Unicode 5.1 */ |
| ucp_Kayah_Li = G_UNICODE_SCRIPT_KAYAH_LI, /* New for Unicode 5.1 */ |
| ucp_Lepcha = G_UNICODE_SCRIPT_LEPCHA, /* New for Unicode 5.1 */ |
| ucp_Lycian = G_UNICODE_SCRIPT_LYCIAN, /* New for Unicode 5.1 */ |
| ucp_Lydian = G_UNICODE_SCRIPT_LYDIAN, /* New for Unicode 5.1 */ |
| ucp_Ol_Chiki = G_UNICODE_SCRIPT_OL_CHIKI, /* New for Unicode 5.1 */ |
| ucp_Rejang = G_UNICODE_SCRIPT_REJANG, /* New for Unicode 5.1 */ |
| ucp_Saurashtra = G_UNICODE_SCRIPT_SAURASHTRA, /* New for Unicode 5.1 */ |
| ucp_Sundanese = G_UNICODE_SCRIPT_SUNDANESE, /* New for Unicode 5.1 */ |
| ucp_Vai = G_UNICODE_SCRIPT_VAI /* New for Unicode 5.1 */ |
| }; |
| |
| #endif |
| |
| /* End of ucp.h */ |