1 | /* |
2 | * Copyright © 2009 Red Hat, Inc. |
3 | * Copyright © 2011 Codethink Limited |
4 | * Copyright © 2011,2012 Google, Inc. |
5 | * |
6 | * This is part of HarfBuzz, a text shaping library. |
7 | * |
8 | * Permission is hereby granted, without written agreement and without |
9 | * license or royalty fees, to use, copy, modify, and distribute this |
10 | * software and its documentation for any purpose, provided that the |
11 | * above copyright notice and the following two paragraphs appear in |
12 | * all copies of this software. |
13 | * |
14 | * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR |
15 | * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES |
16 | * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN |
17 | * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH |
18 | * DAMAGE. |
19 | * |
20 | * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, |
21 | * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND |
22 | * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS |
23 | * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO |
24 | * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. |
25 | * |
26 | * Red Hat Author(s): Behdad Esfahbod |
27 | * Codethink Author(s): Ryan Lortie |
28 | * Google Author(s): Behdad Esfahbod |
29 | */ |
30 | |
31 | #ifndef HB_H_IN |
32 | #error "Include <hb.h> instead." |
33 | #endif |
34 | |
35 | #ifndef HB_UNICODE_H |
36 | #define HB_UNICODE_H |
37 | |
38 | #include "hb-common.h" |
39 | |
40 | HB_BEGIN_DECLS |
41 | |
42 | |
43 | /** |
44 | * HB_UNICODE_MAX |
45 | * |
46 | * Since: 1.9.0 |
47 | **/ |
48 | #define HB_UNICODE_MAX 0x10FFFFu |
49 | |
50 | |
51 | /* hb_unicode_general_category_t */ |
52 | |
53 | /* Unicode Character Database property: General_Category (gc) */ |
54 | typedef enum |
55 | { |
56 | HB_UNICODE_GENERAL_CATEGORY_CONTROL, /* Cc */ |
57 | HB_UNICODE_GENERAL_CATEGORY_FORMAT, /* Cf */ |
58 | HB_UNICODE_GENERAL_CATEGORY_UNASSIGNED, /* Cn */ |
59 | HB_UNICODE_GENERAL_CATEGORY_PRIVATE_USE, /* Co */ |
60 | HB_UNICODE_GENERAL_CATEGORY_SURROGATE, /* Cs */ |
61 | HB_UNICODE_GENERAL_CATEGORY_LOWERCASE_LETTER, /* Ll */ |
62 | HB_UNICODE_GENERAL_CATEGORY_MODIFIER_LETTER, /* Lm */ |
63 | HB_UNICODE_GENERAL_CATEGORY_OTHER_LETTER, /* Lo */ |
64 | HB_UNICODE_GENERAL_CATEGORY_TITLECASE_LETTER, /* Lt */ |
65 | HB_UNICODE_GENERAL_CATEGORY_UPPERCASE_LETTER, /* Lu */ |
66 | HB_UNICODE_GENERAL_CATEGORY_SPACING_MARK, /* Mc */ |
67 | HB_UNICODE_GENERAL_CATEGORY_ENCLOSING_MARK, /* Me */ |
68 | HB_UNICODE_GENERAL_CATEGORY_NON_SPACING_MARK, /* Mn */ |
69 | HB_UNICODE_GENERAL_CATEGORY_DECIMAL_NUMBER, /* Nd */ |
70 | HB_UNICODE_GENERAL_CATEGORY_LETTER_NUMBER, /* Nl */ |
71 | HB_UNICODE_GENERAL_CATEGORY_OTHER_NUMBER, /* No */ |
72 | HB_UNICODE_GENERAL_CATEGORY_CONNECT_PUNCTUATION, /* Pc */ |
73 | HB_UNICODE_GENERAL_CATEGORY_DASH_PUNCTUATION, /* Pd */ |
74 | HB_UNICODE_GENERAL_CATEGORY_CLOSE_PUNCTUATION, /* Pe */ |
75 | HB_UNICODE_GENERAL_CATEGORY_FINAL_PUNCTUATION, /* Pf */ |
76 | HB_UNICODE_GENERAL_CATEGORY_INITIAL_PUNCTUATION, /* Pi */ |
77 | HB_UNICODE_GENERAL_CATEGORY_OTHER_PUNCTUATION, /* Po */ |
78 | HB_UNICODE_GENERAL_CATEGORY_OPEN_PUNCTUATION, /* Ps */ |
79 | HB_UNICODE_GENERAL_CATEGORY_CURRENCY_SYMBOL, /* Sc */ |
80 | HB_UNICODE_GENERAL_CATEGORY_MODIFIER_SYMBOL, /* Sk */ |
81 | HB_UNICODE_GENERAL_CATEGORY_MATH_SYMBOL, /* Sm */ |
82 | HB_UNICODE_GENERAL_CATEGORY_OTHER_SYMBOL, /* So */ |
83 | HB_UNICODE_GENERAL_CATEGORY_LINE_SEPARATOR, /* Zl */ |
84 | HB_UNICODE_GENERAL_CATEGORY_PARAGRAPH_SEPARATOR, /* Zp */ |
85 | HB_UNICODE_GENERAL_CATEGORY_SPACE_SEPARATOR /* Zs */ |
86 | } hb_unicode_general_category_t; |
87 | |
88 | /* hb_unicode_combining_class_t */ |
89 | |
90 | /* Note: newer versions of Unicode may add new values. Clients should be ready to handle |
91 | * any value in the 0..254 range being returned from hb_unicode_combining_class(). |
92 | */ |
93 | |
94 | /* Unicode Character Database property: Canonical_Combining_Class (ccc) */ |
95 | typedef enum |
96 | { |
97 | HB_UNICODE_COMBINING_CLASS_NOT_REORDERED = 0, |
98 | HB_UNICODE_COMBINING_CLASS_OVERLAY = 1, |
99 | HB_UNICODE_COMBINING_CLASS_NUKTA = 7, |
100 | HB_UNICODE_COMBINING_CLASS_KANA_VOICING = 8, |
101 | HB_UNICODE_COMBINING_CLASS_VIRAMA = 9, |
102 | |
103 | /* Hebrew */ |
104 | HB_UNICODE_COMBINING_CLASS_CCC10 = 10, |
105 | HB_UNICODE_COMBINING_CLASS_CCC11 = 11, |
106 | HB_UNICODE_COMBINING_CLASS_CCC12 = 12, |
107 | HB_UNICODE_COMBINING_CLASS_CCC13 = 13, |
108 | HB_UNICODE_COMBINING_CLASS_CCC14 = 14, |
109 | HB_UNICODE_COMBINING_CLASS_CCC15 = 15, |
110 | HB_UNICODE_COMBINING_CLASS_CCC16 = 16, |
111 | HB_UNICODE_COMBINING_CLASS_CCC17 = 17, |
112 | HB_UNICODE_COMBINING_CLASS_CCC18 = 18, |
113 | HB_UNICODE_COMBINING_CLASS_CCC19 = 19, |
114 | HB_UNICODE_COMBINING_CLASS_CCC20 = 20, |
115 | HB_UNICODE_COMBINING_CLASS_CCC21 = 21, |
116 | HB_UNICODE_COMBINING_CLASS_CCC22 = 22, |
117 | HB_UNICODE_COMBINING_CLASS_CCC23 = 23, |
118 | HB_UNICODE_COMBINING_CLASS_CCC24 = 24, |
119 | HB_UNICODE_COMBINING_CLASS_CCC25 = 25, |
120 | HB_UNICODE_COMBINING_CLASS_CCC26 = 26, |
121 | |
122 | /* Arabic */ |
123 | HB_UNICODE_COMBINING_CLASS_CCC27 = 27, |
124 | HB_UNICODE_COMBINING_CLASS_CCC28 = 28, |
125 | HB_UNICODE_COMBINING_CLASS_CCC29 = 29, |
126 | HB_UNICODE_COMBINING_CLASS_CCC30 = 30, |
127 | HB_UNICODE_COMBINING_CLASS_CCC31 = 31, |
128 | HB_UNICODE_COMBINING_CLASS_CCC32 = 32, |
129 | HB_UNICODE_COMBINING_CLASS_CCC33 = 33, |
130 | HB_UNICODE_COMBINING_CLASS_CCC34 = 34, |
131 | HB_UNICODE_COMBINING_CLASS_CCC35 = 35, |
132 | |
133 | /* Syriac */ |
134 | HB_UNICODE_COMBINING_CLASS_CCC36 = 36, |
135 | |
136 | /* Telugu */ |
137 | HB_UNICODE_COMBINING_CLASS_CCC84 = 84, |
138 | HB_UNICODE_COMBINING_CLASS_CCC91 = 91, |
139 | |
140 | /* Thai */ |
141 | HB_UNICODE_COMBINING_CLASS_CCC103 = 103, |
142 | HB_UNICODE_COMBINING_CLASS_CCC107 = 107, |
143 | |
144 | /* Lao */ |
145 | HB_UNICODE_COMBINING_CLASS_CCC118 = 118, |
146 | HB_UNICODE_COMBINING_CLASS_CCC122 = 122, |
147 | |
148 | /* Tibetan */ |
149 | HB_UNICODE_COMBINING_CLASS_CCC129 = 129, |
150 | HB_UNICODE_COMBINING_CLASS_CCC130 = 130, |
151 | HB_UNICODE_COMBINING_CLASS_CCC133 = 132, |
152 | |
153 | |
154 | HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW_LEFT = 200, |
155 | HB_UNICODE_COMBINING_CLASS_ATTACHED_BELOW = 202, |
156 | HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE = 214, |
157 | HB_UNICODE_COMBINING_CLASS_ATTACHED_ABOVE_RIGHT = 216, |
158 | HB_UNICODE_COMBINING_CLASS_BELOW_LEFT = 218, |
159 | HB_UNICODE_COMBINING_CLASS_BELOW = 220, |
160 | HB_UNICODE_COMBINING_CLASS_BELOW_RIGHT = 222, |
161 | HB_UNICODE_COMBINING_CLASS_LEFT = 224, |
162 | HB_UNICODE_COMBINING_CLASS_RIGHT = 226, |
163 | HB_UNICODE_COMBINING_CLASS_ABOVE_LEFT = 228, |
164 | HB_UNICODE_COMBINING_CLASS_ABOVE = 230, |
165 | HB_UNICODE_COMBINING_CLASS_ABOVE_RIGHT = 232, |
166 | HB_UNICODE_COMBINING_CLASS_DOUBLE_BELOW = 233, |
167 | HB_UNICODE_COMBINING_CLASS_DOUBLE_ABOVE = 234, |
168 | |
169 | HB_UNICODE_COMBINING_CLASS_IOTA_SUBSCRIPT = 240, |
170 | |
171 | HB_UNICODE_COMBINING_CLASS_INVALID = 255 |
172 | } hb_unicode_combining_class_t; |
173 | |
174 | |
175 | /* |
176 | * hb_unicode_funcs_t |
177 | */ |
178 | |
179 | typedef struct hb_unicode_funcs_t hb_unicode_funcs_t; |
180 | |
181 | |
182 | /* |
183 | * just give me the best implementation you've got there. |
184 | */ |
185 | HB_EXTERN hb_unicode_funcs_t * |
186 | hb_unicode_funcs_get_default (void); |
187 | |
188 | |
189 | HB_EXTERN hb_unicode_funcs_t * |
190 | hb_unicode_funcs_create (hb_unicode_funcs_t *parent); |
191 | |
192 | HB_EXTERN hb_unicode_funcs_t * |
193 | hb_unicode_funcs_get_empty (void); |
194 | |
195 | HB_EXTERN hb_unicode_funcs_t * |
196 | hb_unicode_funcs_reference (hb_unicode_funcs_t *ufuncs); |
197 | |
198 | HB_EXTERN void |
199 | hb_unicode_funcs_destroy (hb_unicode_funcs_t *ufuncs); |
200 | |
201 | HB_EXTERN hb_bool_t |
202 | hb_unicode_funcs_set_user_data (hb_unicode_funcs_t *ufuncs, |
203 | hb_user_data_key_t *key, |
204 | void * data, |
205 | hb_destroy_func_t destroy, |
206 | hb_bool_t replace); |
207 | |
208 | |
209 | HB_EXTERN void * |
210 | hb_unicode_funcs_get_user_data (hb_unicode_funcs_t *ufuncs, |
211 | hb_user_data_key_t *key); |
212 | |
213 | |
214 | HB_EXTERN void |
215 | hb_unicode_funcs_make_immutable (hb_unicode_funcs_t *ufuncs); |
216 | |
217 | HB_EXTERN hb_bool_t |
218 | hb_unicode_funcs_is_immutable (hb_unicode_funcs_t *ufuncs); |
219 | |
220 | HB_EXTERN hb_unicode_funcs_t * |
221 | hb_unicode_funcs_get_parent (hb_unicode_funcs_t *ufuncs); |
222 | |
223 | |
224 | /* |
225 | * funcs |
226 | */ |
227 | |
228 | /* typedefs */ |
229 | |
230 | typedef hb_unicode_combining_class_t (*hb_unicode_combining_class_func_t) (hb_unicode_funcs_t *ufuncs, |
231 | hb_codepoint_t unicode, |
232 | void *user_data); |
233 | typedef hb_unicode_general_category_t (*hb_unicode_general_category_func_t) (hb_unicode_funcs_t *ufuncs, |
234 | hb_codepoint_t unicode, |
235 | void *user_data); |
236 | typedef hb_codepoint_t (*hb_unicode_mirroring_func_t) (hb_unicode_funcs_t *ufuncs, |
237 | hb_codepoint_t unicode, |
238 | void *user_data); |
239 | typedef hb_script_t (*hb_unicode_script_func_t) (hb_unicode_funcs_t *ufuncs, |
240 | hb_codepoint_t unicode, |
241 | void *user_data); |
242 | |
243 | typedef hb_bool_t (*hb_unicode_compose_func_t) (hb_unicode_funcs_t *ufuncs, |
244 | hb_codepoint_t a, |
245 | hb_codepoint_t b, |
246 | hb_codepoint_t *ab, |
247 | void *user_data); |
248 | typedef hb_bool_t (*hb_unicode_decompose_func_t) (hb_unicode_funcs_t *ufuncs, |
249 | hb_codepoint_t ab, |
250 | hb_codepoint_t *a, |
251 | hb_codepoint_t *b, |
252 | void *user_data); |
253 | |
254 | /* setters */ |
255 | |
256 | /** |
257 | * hb_unicode_funcs_set_combining_class_func: |
258 | * @ufuncs: a Unicode function structure |
259 | * @func: (closure user_data) (destroy destroy) (scope notified): |
260 | * @user_data: |
261 | * @destroy: |
262 | * |
263 | * |
264 | * |
265 | * Since: 0.9.2 |
266 | **/ |
267 | HB_EXTERN void |
268 | hb_unicode_funcs_set_combining_class_func (hb_unicode_funcs_t *ufuncs, |
269 | hb_unicode_combining_class_func_t func, |
270 | void *user_data, hb_destroy_func_t destroy); |
271 | |
272 | /** |
273 | * hb_unicode_funcs_set_general_category_func: |
274 | * @ufuncs: a Unicode function structure |
275 | * @func: (closure user_data) (destroy destroy) (scope notified): |
276 | * @user_data: |
277 | * @destroy: |
278 | * |
279 | * |
280 | * |
281 | * Since: 0.9.2 |
282 | **/ |
283 | HB_EXTERN void |
284 | hb_unicode_funcs_set_general_category_func (hb_unicode_funcs_t *ufuncs, |
285 | hb_unicode_general_category_func_t func, |
286 | void *user_data, hb_destroy_func_t destroy); |
287 | |
288 | /** |
289 | * hb_unicode_funcs_set_mirroring_func: |
290 | * @ufuncs: a Unicode function structure |
291 | * @func: (closure user_data) (destroy destroy) (scope notified): |
292 | * @user_data: |
293 | * @destroy: |
294 | * |
295 | * |
296 | * |
297 | * Since: 0.9.2 |
298 | **/ |
299 | HB_EXTERN void |
300 | hb_unicode_funcs_set_mirroring_func (hb_unicode_funcs_t *ufuncs, |
301 | hb_unicode_mirroring_func_t func, |
302 | void *user_data, hb_destroy_func_t destroy); |
303 | |
304 | /** |
305 | * hb_unicode_funcs_set_script_func: |
306 | * @ufuncs: a Unicode function structure |
307 | * @func: (closure user_data) (destroy destroy) (scope notified): |
308 | * @user_data: |
309 | * @destroy: |
310 | * |
311 | * |
312 | * |
313 | * Since: 0.9.2 |
314 | **/ |
315 | HB_EXTERN void |
316 | hb_unicode_funcs_set_script_func (hb_unicode_funcs_t *ufuncs, |
317 | hb_unicode_script_func_t func, |
318 | void *user_data, hb_destroy_func_t destroy); |
319 | |
320 | /** |
321 | * hb_unicode_funcs_set_compose_func: |
322 | * @ufuncs: a Unicode function structure |
323 | * @func: (closure user_data) (destroy destroy) (scope notified): |
324 | * @user_data: |
325 | * @destroy: |
326 | * |
327 | * |
328 | * |
329 | * Since: 0.9.2 |
330 | **/ |
331 | HB_EXTERN void |
332 | hb_unicode_funcs_set_compose_func (hb_unicode_funcs_t *ufuncs, |
333 | hb_unicode_compose_func_t func, |
334 | void *user_data, hb_destroy_func_t destroy); |
335 | |
336 | /** |
337 | * hb_unicode_funcs_set_decompose_func: |
338 | * @ufuncs: a Unicode function structure |
339 | * @func: (closure user_data) (destroy destroy) (scope notified): |
340 | * @user_data: |
341 | * @destroy: |
342 | * |
343 | * |
344 | * |
345 | * Since: 0.9.2 |
346 | **/ |
347 | HB_EXTERN void |
348 | hb_unicode_funcs_set_decompose_func (hb_unicode_funcs_t *ufuncs, |
349 | hb_unicode_decompose_func_t func, |
350 | void *user_data, hb_destroy_func_t destroy); |
351 | |
352 | /* accessors */ |
353 | |
354 | /** |
355 | * hb_unicode_combining_class: |
356 | * |
357 | * Since: 0.9.2 |
358 | **/ |
359 | HB_EXTERN hb_unicode_combining_class_t |
360 | hb_unicode_combining_class (hb_unicode_funcs_t *ufuncs, |
361 | hb_codepoint_t unicode); |
362 | |
363 | /** |
364 | * hb_unicode_general_category: |
365 | * |
366 | * Since: 0.9.2 |
367 | **/ |
368 | HB_EXTERN hb_unicode_general_category_t |
369 | hb_unicode_general_category (hb_unicode_funcs_t *ufuncs, |
370 | hb_codepoint_t unicode); |
371 | |
372 | /** |
373 | * hb_unicode_mirroring: |
374 | * |
375 | * Since: 0.9.2 |
376 | **/ |
377 | HB_EXTERN hb_codepoint_t |
378 | hb_unicode_mirroring (hb_unicode_funcs_t *ufuncs, |
379 | hb_codepoint_t unicode); |
380 | |
381 | /** |
382 | * hb_unicode_script: |
383 | * |
384 | * Since: 0.9.2 |
385 | **/ |
386 | HB_EXTERN hb_script_t |
387 | hb_unicode_script (hb_unicode_funcs_t *ufuncs, |
388 | hb_codepoint_t unicode); |
389 | |
390 | HB_EXTERN hb_bool_t |
391 | hb_unicode_compose (hb_unicode_funcs_t *ufuncs, |
392 | hb_codepoint_t a, |
393 | hb_codepoint_t b, |
394 | hb_codepoint_t *ab); |
395 | |
396 | HB_EXTERN hb_bool_t |
397 | hb_unicode_decompose (hb_unicode_funcs_t *ufuncs, |
398 | hb_codepoint_t ab, |
399 | hb_codepoint_t *a, |
400 | hb_codepoint_t *b); |
401 | |
402 | HB_END_DECLS |
403 | |
404 | #endif /* HB_UNICODE_H */ |
405 | |