/* blob: fe910ce0031fc325e7dcb5ecc14fb0cea75dd51d [file] [log] [blame] */
/*************************************************
* Unicode Property Table handler *
*************************************************/
#ifndef _UCP_H
#define _UCP_H
/* This file contains definitions of the property values that are returned by
the function _pcre_ucp_findprop(). New values that are added for new releases
of Unicode should always be at the end of each enum, for backwards
compatibility. */
/* General character categories (the one-letter classes). The numeric values
   are written out explicitly so that each one is visibly fixed; any new
   category belongs after ucp_Z. */
enum {
  ucp_C = 0,  /* Other */
  ucp_L = 1,  /* Letter */
  ucp_M = 2,  /* Mark */
  ucp_N = 3,  /* Number */
  ucp_P = 4,  /* Punctuation */
  ucp_S = 5,  /* Symbol */
  ucp_Z = 6   /* Separator */
};
/* Particular character types (the two-letter classes), grouped below by the
   one-letter class that their name starts with. The numeric values are
   written out explicitly so that each one is visibly fixed; any new type
   belongs after ucp_Zs. */
enum {
  /* C: Other */
  ucp_Cc = 0,   /* Control */
  ucp_Cf = 1,   /* Format */
  ucp_Cn = 2,   /* Unassigned */
  ucp_Co = 3,   /* Private use */
  ucp_Cs = 4,   /* Surrogate */

  /* L: Letter */
  ucp_Ll = 5,   /* Lower case letter */
  ucp_Lm = 6,   /* Modifier letter */
  ucp_Lo = 7,   /* Other letter */
  ucp_Lt = 8,   /* Title case letter */
  ucp_Lu = 9,   /* Upper case letter */

  /* M: Mark */
  ucp_Mc = 10,  /* Spacing mark */
  ucp_Me = 11,  /* Enclosing mark */
  ucp_Mn = 12,  /* Non-spacing mark */

  /* N: Number */
  ucp_Nd = 13,  /* Decimal number */
  ucp_Nl = 14,  /* Letter number */
  ucp_No = 15,  /* Other number */

  /* P: Punctuation */
  ucp_Pc = 16,  /* Connector punctuation */
  ucp_Pd = 17,  /* Dash punctuation */
  ucp_Pe = 18,  /* Close punctuation */
  ucp_Pf = 19,  /* Final punctuation */
  ucp_Pi = 20,  /* Initial punctuation */
  ucp_Po = 21,  /* Other punctuation */
  ucp_Ps = 22,  /* Open punctuation */

  /* S: Symbol */
  ucp_Sc = 23,  /* Currency symbol */
  ucp_Sk = 24,  /* Modifier symbol */
  ucp_Sm = 25,  /* Mathematical symbol */
  ucp_So = 26,  /* Other symbol */

  /* Z: Separator */
  ucp_Zl = 27,  /* Line separator */
  ucp_Zp = 28,  /* Paragraph separator */
  ucp_Zs = 29   /* Space separator */
};
/* Script identifications. Every ucp_<Script> constant is defined as the
   G_UNICODE_SCRIPT_<SCRIPT> constant of the same name. Those constants are
   not declared in this file, so their declaring header has to be included
   before this one. */
enum {
  /* Scripts listed ahead of the version-tagged additions further down */
  ucp_Arabic              = G_UNICODE_SCRIPT_ARABIC,
  ucp_Armenian            = G_UNICODE_SCRIPT_ARMENIAN,
  ucp_Bengali             = G_UNICODE_SCRIPT_BENGALI,
  ucp_Bopomofo            = G_UNICODE_SCRIPT_BOPOMOFO,
  ucp_Braille             = G_UNICODE_SCRIPT_BRAILLE,
  ucp_Buginese            = G_UNICODE_SCRIPT_BUGINESE,
  ucp_Buhid               = G_UNICODE_SCRIPT_BUHID,
  ucp_Canadian_Aboriginal = G_UNICODE_SCRIPT_CANADIAN_ABORIGINAL,
  ucp_Cherokee            = G_UNICODE_SCRIPT_CHEROKEE,
  ucp_Common              = G_UNICODE_SCRIPT_COMMON,
  ucp_Coptic              = G_UNICODE_SCRIPT_COPTIC,
  ucp_Cypriot             = G_UNICODE_SCRIPT_CYPRIOT,
  ucp_Cyrillic            = G_UNICODE_SCRIPT_CYRILLIC,
  ucp_Deseret             = G_UNICODE_SCRIPT_DESERET,
  ucp_Devanagari          = G_UNICODE_SCRIPT_DEVANAGARI,
  ucp_Ethiopic            = G_UNICODE_SCRIPT_ETHIOPIC,
  ucp_Georgian            = G_UNICODE_SCRIPT_GEORGIAN,
  ucp_Glagolitic          = G_UNICODE_SCRIPT_GLAGOLITIC,
  ucp_Gothic              = G_UNICODE_SCRIPT_GOTHIC,
  ucp_Greek               = G_UNICODE_SCRIPT_GREEK,
  ucp_Gujarati            = G_UNICODE_SCRIPT_GUJARATI,
  ucp_Gurmukhi            = G_UNICODE_SCRIPT_GURMUKHI,
  ucp_Han                 = G_UNICODE_SCRIPT_HAN,
  ucp_Hangul              = G_UNICODE_SCRIPT_HANGUL,
  ucp_Hanunoo             = G_UNICODE_SCRIPT_HANUNOO,
  ucp_Hebrew              = G_UNICODE_SCRIPT_HEBREW,
  ucp_Hiragana            = G_UNICODE_SCRIPT_HIRAGANA,
  ucp_Inherited           = G_UNICODE_SCRIPT_INHERITED,
  ucp_Kannada             = G_UNICODE_SCRIPT_KANNADA,
  ucp_Katakana            = G_UNICODE_SCRIPT_KATAKANA,
  ucp_Kharoshthi          = G_UNICODE_SCRIPT_KHAROSHTHI,
  ucp_Khmer               = G_UNICODE_SCRIPT_KHMER,
  ucp_Lao                 = G_UNICODE_SCRIPT_LAO,
  ucp_Latin               = G_UNICODE_SCRIPT_LATIN,
  ucp_Limbu               = G_UNICODE_SCRIPT_LIMBU,
  ucp_Linear_B            = G_UNICODE_SCRIPT_LINEAR_B,
  ucp_Malayalam           = G_UNICODE_SCRIPT_MALAYALAM,
  ucp_Mongolian           = G_UNICODE_SCRIPT_MONGOLIAN,
  ucp_Myanmar             = G_UNICODE_SCRIPT_MYANMAR,
  ucp_New_Tai_Lue         = G_UNICODE_SCRIPT_NEW_TAI_LUE,
  ucp_Ogham               = G_UNICODE_SCRIPT_OGHAM,
  ucp_Old_Italic          = G_UNICODE_SCRIPT_OLD_ITALIC,
  ucp_Old_Persian         = G_UNICODE_SCRIPT_OLD_PERSIAN,
  ucp_Oriya               = G_UNICODE_SCRIPT_ORIYA,
  ucp_Osmanya             = G_UNICODE_SCRIPT_OSMANYA,
  ucp_Runic               = G_UNICODE_SCRIPT_RUNIC,
  ucp_Shavian             = G_UNICODE_SCRIPT_SHAVIAN,
  ucp_Sinhala             = G_UNICODE_SCRIPT_SINHALA,
  ucp_Syloti_Nagri        = G_UNICODE_SCRIPT_SYLOTI_NAGRI,
  ucp_Syriac              = G_UNICODE_SCRIPT_SYRIAC,
  ucp_Tagalog             = G_UNICODE_SCRIPT_TAGALOG,
  ucp_Tagbanwa            = G_UNICODE_SCRIPT_TAGBANWA,
  ucp_Tai_Le              = G_UNICODE_SCRIPT_TAI_LE,
  ucp_Tamil               = G_UNICODE_SCRIPT_TAMIL,
  ucp_Telugu              = G_UNICODE_SCRIPT_TELUGU,
  ucp_Thaana              = G_UNICODE_SCRIPT_THAANA,
  ucp_Thai                = G_UNICODE_SCRIPT_THAI,
  ucp_Tibetan             = G_UNICODE_SCRIPT_TIBETAN,
  ucp_Tifinagh            = G_UNICODE_SCRIPT_TIFINAGH,
  ucp_Ugaritic            = G_UNICODE_SCRIPT_UGARITIC,
  ucp_Yi                  = G_UNICODE_SCRIPT_YI,

  /* New for Unicode 5.0.0 */
  ucp_Balinese            = G_UNICODE_SCRIPT_BALINESE,
  ucp_Cuneiform           = G_UNICODE_SCRIPT_CUNEIFORM,
  ucp_Nko                 = G_UNICODE_SCRIPT_NKO,
  ucp_Phags_Pa            = G_UNICODE_SCRIPT_PHAGS_PA,
  ucp_Phoenician          = G_UNICODE_SCRIPT_PHOENICIAN,

  /* New for Unicode 5.1 */
  ucp_Carian              = G_UNICODE_SCRIPT_CARIAN,
  ucp_Cham                = G_UNICODE_SCRIPT_CHAM,
  ucp_Kayah_Li            = G_UNICODE_SCRIPT_KAYAH_LI,
  ucp_Lepcha              = G_UNICODE_SCRIPT_LEPCHA,
  ucp_Lycian              = G_UNICODE_SCRIPT_LYCIAN,
  ucp_Lydian              = G_UNICODE_SCRIPT_LYDIAN,
  ucp_Ol_Chiki            = G_UNICODE_SCRIPT_OL_CHIKI,
  ucp_Rejang              = G_UNICODE_SCRIPT_REJANG,
  ucp_Saurashtra          = G_UNICODE_SCRIPT_SAURASHTRA,
  ucp_Sundanese           = G_UNICODE_SCRIPT_SUNDANESE,
  ucp_Vai                 = G_UNICODE_SCRIPT_VAI
};
#endif
/* End of ucp.h */