ROOT_528-00b_version: core/pcre/src/pcre-7.8/ucp.h Source File

00001 /*************************************************
00002 *          Unicode Property Table handler        *
00003 *************************************************/
00004 
00005 #ifndef _UCP_H
00006 #define _UCP_H
00007 
00008 /* This file contains definitions of the property values that are returned by
00009 the function _pcre_ucp_findprop(). New values that are added for new releases
00010 of Unicode should always be at the end of each enum, for backwards
00011 compatibility. */
00012 
00013 /* These are the general character categories. No explicit values are given, so they number consecutively from 0 (ucp_C) to 6 (ucp_Z). */
00014 
00015 enum {       /* anonymous enum: the names are plain int constants */
00016   ucp_C,     /* Other */
00017   ucp_L,     /* Letter */
00018   ucp_M,     /* Mark */
00019   ucp_N,     /* Number */
00020   ucp_P,     /* Punctuation */
00021   ucp_S,     /* Symbol */
00022   ucp_Z      /* Separator */
00023 };           /* append any new category after ucp_Z so the existing values do not change */
00024 
00025 /* These are the particular character types. Each name starts with the letter of one general category (C, L, M, N, P, S, Z) and the entries are grouped in that order; values run from 0 (ucp_Cc) to 29 (ucp_Zs). */
00026 
00027 enum {       /* anonymous enum: the names are plain int constants */
00028   ucp_Cc,    /* Control */
00029   ucp_Cf,    /* Format */
00030   ucp_Cn,    /* Unassigned */
00031   ucp_Co,    /* Private use */
00032   ucp_Cs,    /* Surrogate */
00033   ucp_Ll,    /* Lower case letter */
00034   ucp_Lm,    /* Modifier letter */
00035   ucp_Lo,    /* Other letter */
00036   ucp_Lt,    /* Title case letter */
00037   ucp_Lu,    /* Upper case letter */
00038   ucp_Mc,    /* Spacing mark */
00039   ucp_Me,    /* Enclosing mark */
00040   ucp_Mn,    /* Non-spacing mark */
00041   ucp_Nd,    /* Decimal number */
00042   ucp_Nl,    /* Letter number */
00043   ucp_No,    /* Other number */
00044   ucp_Pc,    /* Connector punctuation */
00045   ucp_Pd,    /* Dash punctuation */
00046   ucp_Pe,    /* Close punctuation */
00047   ucp_Pf,    /* Final punctuation */
00048   ucp_Pi,    /* Initial punctuation */
00049   ucp_Po,    /* Other punctuation */
00050   ucp_Ps,    /* Open punctuation */
00051   ucp_Sc,    /* Currency symbol */
00052   ucp_Sk,    /* Modifier symbol */
00053   ucp_Sm,    /* Mathematical symbol */
00054   ucp_So,    /* Other symbol */
00055   ucp_Zl,    /* Line separator */
00056   ucp_Zp,    /* Paragraph separator */
00057   ucp_Zs     /* Space separator */
00058 };           /* append any new type after ucp_Zs so the existing values do not change */
00059 
00060 /* These are the script identifications. The original list (ucp_Arabic to ucp_Yi, values 0-60) is alphabetical; scripts from later Unicode releases are appended in their own groups, so the last value is 76 (ucp_Vai). */
00061 
00062 enum {       /* anonymous enum: the names are plain int constants */
00063   ucp_Arabic,
00064   ucp_Armenian,
00065   ucp_Bengali,
00066   ucp_Bopomofo,
00067   ucp_Braille,
00068   ucp_Buginese,
00069   ucp_Buhid,
00070   ucp_Canadian_Aboriginal,
00071   ucp_Cherokee,
00072   ucp_Common,
00073   ucp_Coptic,
00074   ucp_Cypriot,
00075   ucp_Cyrillic,
00076   ucp_Deseret,
00077   ucp_Devanagari,
00078   ucp_Ethiopic,
00079   ucp_Georgian,
00080   ucp_Glagolitic,
00081   ucp_Gothic,
00082   ucp_Greek,
00083   ucp_Gujarati,
00084   ucp_Gurmukhi,
00085   ucp_Han,
00086   ucp_Hangul,
00087   ucp_Hanunoo,
00088   ucp_Hebrew,
00089   ucp_Hiragana,
00090   ucp_Inherited,
00091   ucp_Kannada,
00092   ucp_Katakana,
00093   ucp_Kharoshthi,
00094   ucp_Khmer,
00095   ucp_Lao,
00096   ucp_Latin,
00097   ucp_Limbu,
00098   ucp_Linear_B,
00099   ucp_Malayalam,
00100   ucp_Mongolian,
00101   ucp_Myanmar,
00102   ucp_New_Tai_Lue,
00103   ucp_Ogham,
00104   ucp_Old_Italic,
00105   ucp_Old_Persian,
00106   ucp_Oriya,
00107   ucp_Osmanya,
00108   ucp_Runic,
00109   ucp_Shavian,
00110   ucp_Sinhala,
00111   ucp_Syloti_Nagri,
00112   ucp_Syriac,
00113   ucp_Tagalog,
00114   ucp_Tagbanwa,
00115   ucp_Tai_Le,
00116   ucp_Tamil,
00117   ucp_Telugu,
00118   ucp_Thaana,
00119   ucp_Thai,
00120   ucp_Tibetan,
00121   ucp_Tifinagh,
00122   ucp_Ugaritic,
00123   ucp_Yi,
00124   /* New for Unicode 5.0 (appended after ucp_Yi; values 61-65): */
00125   ucp_Balinese,
00126   ucp_Cuneiform,
00127   ucp_Nko,
00128   ucp_Phags_Pa,
00129   ucp_Phoenician,
00130   /* New for Unicode 5.1 (appended after the 5.0 group; values 66-76): */
00131   ucp_Carian,
00132   ucp_Cham,
00133   ucp_Kayah_Li,
00134   ucp_Lepcha,
00135   ucp_Lycian,
00136   ucp_Lydian,
00137   ucp_Ol_Chiki,
00138   ucp_Rejang,
00139   ucp_Saurashtra,
00140   ucp_Sundanese,
00141   ucp_Vai
00142 };           /* append scripts from later Unicode releases after ucp_Vai so the existing values do not change */
00143 
00144 #endif
00145 
00146 /* End of ucp.h */