/[pcre]/code/trunk/ucp.h
ViewVC logotype

Diff of /code/trunk/ucp.h

Parent Directory Parent Directory | Revision Log Revision Log | View Patch Patch

revision 85 by nigel, Sat Feb 24 21:41:13 2007 UTC revision 1011 by ph10, Sat Aug 25 11:36:15 2012 UTC
# Line 1  Line 1 
1  /*************************************************  /*************************************************
2  *     libucp - Unicode Property Table handler    *  *          Unicode Property Table handler        *
3  *************************************************/  *************************************************/
4    
   
5  #ifndef _UCP_H  #ifndef _UCP_H
6  #define _UCP_H  #define _UCP_H
7    
8  /* These are the character categories that are returned by ucp_findchar */  /* This file contains definitions of the property values that are returned by
9    the UCD access macros. New values that are added for new releases of Unicode
10    should always be at the end of each enum, for backwards compatibility.
11    
12    IMPORTANT: Note also that the specific numeric values of the enums have to be
13    the same as the values that are generated by the maint/MultiStage2.py script,
14    where the equivalent property descriptive names are listed in vectors. */
15    
16    /* These are the general character categories. */
17    
18  enum {  enum {
19    ucp_C,     /* Other */    ucp_C,     /* Other */
# Line 18  enum { Line 25  enum {
25    ucp_Z      /* Separator */    ucp_Z      /* Separator */
26  };  };
27    
28  /* These are the detailed character types that are returned by ucp_findchar */  /* These are the particular character categories. */
29    
30  enum {  enum {
31    ucp_Cc,    /* Control */    ucp_Cc,    /* Control */
# Line 53  enum { Line 60  enum {
60    ucp_Zs     /* Space separator */    ucp_Zs     /* Space separator */
61  };  };
62    
63    /* These are grapheme break properties. Note that the code for processing them
64    assumes that the values are less than 16. If more values are added that take
65    the number to 16 or more, the code will have to be rewritten. */
66    
67    enum {
68      ucp_gbCR,             /*  0 */
69      ucp_gbLF,             /*  1 */
70      ucp_gbControl,        /*  2 */
71      ucp_gbExtend,         /*  3 */
72      ucp_gbPrepend,        /*  4 */
73      ucp_gbSpacingMark,    /*  5 */
74      ucp_gbL,              /*  6 Hangul syllable type L */
75      ucp_gbV,              /*  7 Hangul syllable type V */
76      ucp_gbT,              /*  8 Hangul syllable type T */
77      ucp_gbLV,             /*  9 Hangul syllable type LV */
78      ucp_gbLVT,            /* 10 Hangul syllable type LVT */
79      ucp_gbOther,          /* 11 */
80      ucp_gbCount           /* 12 The number of properties */
81    };
82    
83    /* These are the script identifications. */
84    
85    enum {
86      ucp_Arabic,
87      ucp_Armenian,
88      ucp_Bengali,
89      ucp_Bopomofo,
90      ucp_Braille,
91      ucp_Buginese,
92      ucp_Buhid,
93      ucp_Canadian_Aboriginal,
94      ucp_Cherokee,
95      ucp_Common,
96      ucp_Coptic,
97      ucp_Cypriot,
98      ucp_Cyrillic,
99      ucp_Deseret,
100      ucp_Devanagari,
101      ucp_Ethiopic,
102      ucp_Georgian,
103      ucp_Glagolitic,
104      ucp_Gothic,
105      ucp_Greek,
106      ucp_Gujarati,
107      ucp_Gurmukhi,
108      ucp_Han,
109      ucp_Hangul,
110      ucp_Hanunoo,
111      ucp_Hebrew,
112      ucp_Hiragana,
113      ucp_Inherited,
114      ucp_Kannada,
115      ucp_Katakana,
116      ucp_Kharoshthi,
117      ucp_Khmer,
118      ucp_Lao,
119      ucp_Latin,
120      ucp_Limbu,
121      ucp_Linear_B,
122      ucp_Malayalam,
123      ucp_Mongolian,
124      ucp_Myanmar,
125      ucp_New_Tai_Lue,
126      ucp_Ogham,
127      ucp_Old_Italic,
128      ucp_Old_Persian,
129      ucp_Oriya,
130      ucp_Osmanya,
131      ucp_Runic,
132      ucp_Shavian,
133      ucp_Sinhala,
134      ucp_Syloti_Nagri,
135      ucp_Syriac,
136      ucp_Tagalog,
137      ucp_Tagbanwa,
138      ucp_Tai_Le,
139      ucp_Tamil,
140      ucp_Telugu,
141      ucp_Thaana,
142      ucp_Thai,
143      ucp_Tibetan,
144      ucp_Tifinagh,
145      ucp_Ugaritic,
146      ucp_Yi,
147      /* New for Unicode 5.0: */
148      ucp_Balinese,
149      ucp_Cuneiform,
150      ucp_Nko,
151      ucp_Phags_Pa,
152      ucp_Phoenician,
153      /* New for Unicode 5.1: */
154      ucp_Carian,
155      ucp_Cham,
156      ucp_Kayah_Li,
157      ucp_Lepcha,
158      ucp_Lycian,
159      ucp_Lydian,
160      ucp_Ol_Chiki,
161      ucp_Rejang,
162      ucp_Saurashtra,
163      ucp_Sundanese,
164      ucp_Vai,
165      /* New for Unicode 5.2: */
166      ucp_Avestan,
167      ucp_Bamum,
168      ucp_Egyptian_Hieroglyphs,
169      ucp_Imperial_Aramaic,
170      ucp_Inscriptional_Pahlavi,
171      ucp_Inscriptional_Parthian,
172      ucp_Javanese,
173      ucp_Kaithi,
174      ucp_Lisu,
175      ucp_Meetei_Mayek,
176      ucp_Old_South_Arabian,
177      ucp_Old_Turkic,
178      ucp_Samaritan,
179      ucp_Tai_Tham,
180      ucp_Tai_Viet,
181      /* New for Unicode 6.0.0: */
182      ucp_Batak,
183      ucp_Brahmi,
184      ucp_Mandaic,
185      /* New for Unicode 6.1.0: */
186      ucp_Chakma,
187      ucp_Meroitic_Cursive,
188      ucp_Meroitic_Hieroglyphs,
189      ucp_Miao,
190      ucp_Sharada,
191      ucp_Sora_Sompeng,
192      ucp_Takri
193    };
194    
195  #endif  #endif
196    
197  /* End of ucp.h */  /* End of ucp.h */

Legend:
Removed from v.85  
changed lines
  Added in v.1011

  ViewVC Help
Powered by ViewVC 1.1.5