1/*
2 * Copyright © 2013 Ran Benita
3 *
4 * Permission is hereby granted, free of charge, to any person obtaining a
5 * copy of this software and associated documentation files (the "Software"),
6 * to deal in the Software without restriction, including without limitation
7 * the rights to use, copy, modify, merge, publish, distribute, sublicense,
8 * and/or sell copies of the Software, and to permit persons to whom the
9 * Software is furnished to do so, subject to the following conditions:
10 *
11 * The above copyright notice and this permission notice (including the next
12 * paragraph) shall be included in all copies or substantial portions of the
13 * Software.
14 *
15 * THE SOFTWARE IS PROVIDED "AS IS", WITHOUT WARRANTY OF ANY KIND, EXPRESS OR
16 * IMPLIED, INCLUDING BUT NOT LIMITED TO THE WARRANTIES OF MERCHANTABILITY,
17 * FITNESS FOR A PARTICULAR PURPOSE AND NONINFRINGEMENT. IN NO EVENT SHALL
18 * THE AUTHORS OR COPYRIGHT HOLDERS BE LIABLE FOR ANY CLAIM, DAMAGES OR OTHER
19 * LIABILITY, WHETHER IN AN ACTION OF CONTRACT, TORT OR OTHERWISE, ARISING
20 * FROM, OUT OF OR IN CONNECTION WITH THE SOFTWARE OR THE USE OR OTHER
21 * DEALINGS IN THE SOFTWARE.
22 */
23
24#ifndef _XKBCOMMON_COMPOSE_H
25#define _XKBCOMMON_COMPOSE_H
26
27#include <xkbcommon/xkbcommon.h>
28
29#ifdef __cplusplus
30extern "C" {
31#endif
32
33/**
34 * @file
35 * libxkbcommon Compose API - support for Compose and dead-keys.
36 */
37
38/**
39 * @defgroup compose Compose and dead-keys support
40 * Support for Compose and dead-keys.
41 * @since 0.5.0
42 *
43 * @{
44 */
45
46/**
47 * @page compose-overview Overview
48 * @parblock
49 *
50 * Compose and dead-keys are a common feature of many keyboard input
51 * systems. They extend the range of the keysyms that can be produced
52 * directly from a keyboard by using a sequence of key strokes, instead
53 * of just one.
54 *
55 * Here are some example sequences, in the libX11 Compose file format:
56 *
57 * <dead_acute> <a> : "á" aacute # LATIN SMALL LETTER A WITH ACUTE
58 * <Multi_key> <A> <T> : "@" at # COMMERCIAL AT
59 *
60 * When the user presses a key which produces the `<dead_acute>` keysym,
61 * nothing initially happens (thus the key is dubbed a "dead-key"). But
62 * when the user enters `<a>`, "á" is "composed", in place of "a". If
63 * instead the user had entered a keysym which does not follow
64 * `<dead_acute>` in any compose sequence, the sequence is said to be
65 * "cancelled".
66 *
67 * Compose files define many such sequences. For a description of the
68 * common file format for Compose files, see the Compose(5) man page.
69 *
70 * A successfully-composed sequence has two results: a keysym and a UTF-8
71 * string. At least one of the two is defined for each sequence. If only
72 * a keysym is given, the keysym's string representation is used for the
73 * result string (using xkb_keysym_to_utf8()).
74 *
75 * This library provides low-level support for Compose file parsing and
76 * processing. Higher-level APIs (such as libX11's `Xutf8LookupString`(3))
77 * may be built upon it, or it can be used directly.
78 *
79 * @endparblock
80 */
81
82/**
83 * @page compose-conflicting Conflicting Sequences
84 * @parblock
85 *
86 * To avoid ambiguity, a sequence is not allowed to be a prefix of another.
87 * In such a case, the conflict is resolved thus:
88 *
89 * 1. A longer sequence overrides a shorter one.
90 * 2. An equal sequence overrides an existing one.
91 * 3. A shorter sequence does not override a longer one.
92 *
93 * Sequences of length 1 are allowed.
94 *
95 * @endparblock
96 */
97
98/**
99 * @page compose-cancellation Cancellation Behavior
100 * @parblock
101 *
102 * What should happen when a sequence is cancelled? For example, consider
103 * there are only the above sequences, and the input keysyms are
104 * `<dead_acute> <b>`. There are a few approaches:
105 *
106 * 1. Swallow the cancelling keysym; that is, no keysym is produced.
107 * This is the approach taken by libX11.
108 * 2. Let the cancelling keysym through; that is, `<b>` is produced.
109 * 3. Replay the entire sequence; that is, `<dead_acute> <b>` is produced.
110 * This is the approach taken by Microsoft Windows (approximately;
111 * instead of `<dead_acute>`, the underlying key is used. This is
112 * difficult to simulate with XKB keymaps).
113 *
114 * You can program whichever approach best fits users' expectations.
115 *
116 * @endparblock
117 */
118
119/**
120 * @struct xkb_compose_table
121 * Opaque, reference-counted Compose table object.
122 *
123 * The compose table holds the definitions of the Compose sequences, as
124 * gathered from Compose files. It is immutable once it has been created.
125 */
126struct xkb_compose_table;
127
128/**
129 * @struct xkb_compose_state
130 * Opaque, reference-counted Compose state object.
131 *
132 * The compose state tracks compose sequence matching: which sequences
133 * are still possible and the position within them. It acts as a simple
134 * state machine wherein keysyms given to xkb_compose_state_feed() are
135 * the input, and composed keysyms and strings are the output.
136 *
137 * The compose state is usually associated with a keyboard device.
138 */
139struct xkb_compose_state;
140
141/** Flags affecting Compose file compilation (see xkb_compose_table_new_from_locale()). */
142enum xkb_compose_compile_flags {
143 /** Do not apply any flags; equivalent to passing 0. */
144 XKB_COMPOSE_COMPILE_NO_FLAGS = 0
145};
146
147/** The Compose file formats recognized when compiling from a file or a buffer. */
148enum xkb_compose_format {
149 /** The classic libX11 Compose text format, described in Compose(5). */
150 XKB_COMPOSE_FORMAT_TEXT_V1 = 1
151};
152
153/**
154 * @page compose-locale Compose Locale
155 * @parblock
156 *
157 * Compose files are locale dependent:
158 * - Compose files are written for a locale, and the locale is used when
159 * searching for the appropriate file to use.
160 * - Compose files may reference the locale internally, with directives
161 * such as \%L.
162 *
163 * As such, functions like xkb_compose_table_new_from_locale() require
164 * a `locale` parameter. This will usually be the current locale (see
165 * locale(7) for more details). You may also want to allow the user to
166 * explicitly configure it, so they can use the Compose file of a given
167 * locale, but not use that locale for other things.
168 *
169 * You may query the current locale as follows:
170 * @code
171 * const char *locale;
172 * locale = setlocale(LC_CTYPE, NULL);
173 * @endcode
174 *
175 * This will only give useful results if the program had previously set
176 * the current locale using setlocale(3), with `LC_CTYPE` or `LC_ALL`
177 * and a non-NULL argument.
178 *
179 * If you prefer not to use the locale system of the C runtime library,
180 * you may nevertheless obtain the user's locale directly using
181 * environment variables, as described in locale(7). For example,
182 * @code
183 * const char *locale;
184 * locale = getenv("LC_ALL");
185 * if (!locale || !*locale)
186 * locale = getenv("LC_CTYPE");
187 * if (!locale || !*locale)
188 * locale = getenv("LANG");
189 * if (!locale || !*locale)
190 * locale = "C";
191 * @endcode
192 *
193 * Note that some locales supported by the C standard library may not
194 * have a Compose file assigned.
195 *
196 * @endparblock
197 */
198
199/**
200 * Create a compose table by locating and compiling a locale's Compose file.
201 *
202 * The locale is used for searching the file-system for an appropriate
203 * Compose file. The search order is described in Compose(5). It is
204 * affected by the following environment variables:
205 *
206 * 1. `XCOMPOSEFILE` - see Compose(5).
207 * 2. `HOME` - see Compose(5).
208 * 3. `XLOCALEDIR` - if set, used as the base directory for the system's
209 * X locale files, e.g. `/usr/share/X11/locale`, instead of the
210 * preconfigured directory.
211 *
212 * @param context
213 * The library context in which to create the compose table.
214 * @param locale
215 * The current locale. See @ref compose-locale.\n
216 *
217 * The value is copied, so it is safe to pass the result of getenv(3)
218 * (or similar) without fear of it being invalidated by a subsequent
219 * setenv(3) (or similar).
220 * @param flags
221 * Optional flags for the compose table, or 0 (XKB_COMPOSE_COMPILE_NO_FLAGS).
222 *
223 * @returns A compose table for the given locale, or NULL if the
224 * compilation failed or a Compose file was not found.
225 *
226 * @memberof xkb_compose_table
227 */
228struct xkb_compose_table *
229xkb_compose_table_new_from_locale(struct xkb_context *context,
230 const char *locale,
231 enum xkb_compose_compile_flags flags);
232
233/**
234 * Create a new compose table by compiling a given Compose file.
235 *
236 * @param context
237 * The library context in which to create the compose table.
238 * @param file
239 * The Compose file to compile, given as a stdio `FILE` stream.
240 * @param locale
241 * The current locale. See @ref compose-locale.
242 * @param format
243 * The text format of the Compose file (see enum xkb_compose_format).
244 * @param flags
245 * Optional flags for the compose table, or 0 (XKB_COMPOSE_COMPILE_NO_FLAGS).
246 *
247 * @returns A compose table compiled from the given file, or NULL if
248 * the compilation failed.
249 *
250 * @memberof xkb_compose_table
251 */
252struct xkb_compose_table *
253xkb_compose_table_new_from_file(struct xkb_context *context,
254 FILE *file,
255 const char *locale,
256 enum xkb_compose_format format,
257 enum xkb_compose_compile_flags flags);
258
259/**
260 * Create a new compose table from a memory buffer.
261 *
262 * This is just like xkb_compose_table_new_from_file(), but instead of a
263 * file, the Compose text is read from `buffer`, whose size is `length`.
264 *
265 * @see xkb_compose_table_new_from_file()
266 * @memberof xkb_compose_table
267 */
268struct xkb_compose_table *
269xkb_compose_table_new_from_buffer(struct xkb_context *context,
270 const char *buffer, size_t length,
271 const char *locale,
272 enum xkb_compose_format format,
273 enum xkb_compose_compile_flags flags);
274
275/**
276 * Take a new reference on the compose table `table`.
277 *
278 * @returns The passed-in compose table.
279 *
280 * @memberof xkb_compose_table
281 */
282struct xkb_compose_table *
283xkb_compose_table_ref(struct xkb_compose_table *table);
284
285/**
286 * Release a reference on a compose table; the table may be freed as a result.
287 *
288 * @param table The compose table. If it is NULL, this function does nothing.
289 *
290 * @memberof xkb_compose_table
291 */
292void
293xkb_compose_table_unref(struct xkb_compose_table *table);
294
295/** Flags for compose state creation, as taken by xkb_compose_state_new(). */
296enum xkb_compose_state_flags {
297 /** Do not apply any flags; equivalent to passing 0. */
298 XKB_COMPOSE_STATE_NO_FLAGS = 0
299};
300
301/**
302 * Create a new compose state object which matches against a compose table.
303 *
304 * @param table
305 * The compose table the state will use (see xkb_compose_state_get_compose_table()).
306 * @param flags
307 * Optional flags for the compose state, or 0 (XKB_COMPOSE_STATE_NO_FLAGS).
308 *
309 * @returns A new compose state, or NULL on failure.
310 *
311 * @memberof xkb_compose_state
312 */
313struct xkb_compose_state *
314xkb_compose_state_new(struct xkb_compose_table *table,
315 enum xkb_compose_state_flags flags);
316
317/**
318 * Take a new reference on the compose state object `state`.
319 *
320 * @returns The passed-in compose state.
321 *
322 * @memberof xkb_compose_state
323 */
324struct xkb_compose_state *
325xkb_compose_state_ref(struct xkb_compose_state *state);
326
327/**
328 * Release a reference on a compose state object; it may be freed as a result.
329 *
330 * @param state The compose state. If it is NULL, this function does nothing.
331 *
332 * @memberof xkb_compose_state
333 */
334void
335xkb_compose_state_unref(struct xkb_compose_state *state);
336
337/**
338 * Get the compose table which a compose state object is using.
339 *
340 * @returns The compose table which was passed to xkb_compose_state_new()
341 * when creating this state object.
342 *
343 * This function does not take a new reference on the compose table; call
344 * xkb_compose_table_ref() on it yourself if you plan to use it beyond the
345 * lifetime of the state.
346 *
347 * @memberof xkb_compose_state
348 */
349struct xkb_compose_table *
350xkb_compose_state_get_compose_table(struct xkb_compose_state *state);
351
352/** Status of the Compose state machine, as reported by xkb_compose_state_get_status(). */
353enum xkb_compose_status {
354 /** The initial state; no sequence has started yet. Also set by xkb_compose_state_reset(). */
355 XKB_COMPOSE_NOTHING,
356 /** In the middle of a sequence; more keysyms are needed to complete it. */
357 XKB_COMPOSE_COMPOSING,
358 /** A complete sequence has been matched; its result can now be retrieved. */
359 XKB_COMPOSE_COMPOSED,
360 /** The last sequence was cancelled due to an unmatched keysym. */
361 XKB_COMPOSE_CANCELLED
362};
363
364/** The effect of a keysym fed to xkb_compose_state_feed(), returned by that function. */
365enum xkb_compose_feed_result {
366 /** The keysym had no effect - it did not affect the status (e.g. a modifier keysym). */
367 XKB_COMPOSE_FEED_IGNORED,
368 /** The keysym started, advanced or cancelled a sequence. */
369 XKB_COMPOSE_FEED_ACCEPTED
370};
371
372/**
373 * Feed one keysym to the Compose sequence state machine.
374 *
375 * This function can advance into a compose sequence, cancel a sequence,
376 * start a new sequence, or do nothing in particular. The resulting
377 * status may be observed with xkb_compose_state_get_status().
378 *
379 * Some keysyms, such as keysyms for modifier keys, are ignored - they
380 * have no effect on the status or otherwise.
381 *
382 * The following is a description of the possible status transitions, in
383 * the format CURRENT STATUS => NEXT STATUS, given a non-ignored input
384 * keysym `keysym`:
385 *
386 @verbatim
387 NOTHING or CANCELLED or COMPOSED =>
388 NOTHING if keysym does not start a sequence.
389 COMPOSING if keysym starts a sequence.
390 COMPOSED if keysym starts and terminates a single-keysym sequence.
391
392 COMPOSING =>
393 COMPOSING if keysym advances any of the currently possible
394 sequences but does not terminate any of them.
395 COMPOSED if keysym terminates one of the currently possible
396 sequences.
397 CANCELLED if keysym does not advance any of the currently
398 possible sequences.
399 @endverbatim
400 *
401 * The current Compose formats do not support multiple-keysyms.
402 * Therefore, if you are using a function such as xkb_state_key_get_syms()
403 * and it returns more than one keysym, consider feeding XKB_KEY_NoSymbol
404 * instead.
405 *
406 * @param state
407 * The compose state object.
408 * @param keysym
409 * A keysym, usually obtained after a key-press event, with a
410 * function such as xkb_state_key_get_one_sym().
411 *
412 * @returns XKB_COMPOSE_FEED_IGNORED if the keysym was ignored, otherwise
413 * XKB_COMPOSE_FEED_ACCEPTED. Useful, e.g., to record the sequence so far.
414 *
415 * @memberof xkb_compose_state
416 */
417enum xkb_compose_feed_result
418xkb_compose_state_feed(struct xkb_compose_state *state,
419 xkb_keysym_t keysym);
420
421/**
422 * Reset the Compose sequence state machine.
423 *
424 * The status is set to XKB_COMPOSE_NOTHING, and any sequence currently
425 * being matched is discarded.
426 *
427 * @memberof xkb_compose_state
428 */
429void
430xkb_compose_state_reset(struct xkb_compose_state *state);
431
432/**
433 * Get the current status of the compose state machine (see xkb_compose_state_feed()).
434 *
435 * @see xkb_compose_status
436 * @memberof xkb_compose_state
437 */
438enum xkb_compose_status
439xkb_compose_state_get_status(struct xkb_compose_state *state);
440
441/**
442 * Get the result Unicode/UTF-8 string for a composed sequence.
443 *
444 * See @ref compose-overview for more details. This function is only
445 * useful when the status is XKB_COMPOSE_COMPOSED.
446 *
447 * @param[in] state
448 * The compose state.
449 * @param[out] buffer
450 * A buffer to write the string into.
451 * @param[in] size
452 * Size of the buffer, in bytes.
453 *
454 * @warning If the buffer passed is too small, the string is truncated
455 * (though still NUL-terminated).
456 *
457 * @returns
458 * The number of bytes required for the string, excluding the NUL byte.
459 * If the sequence is not complete, or does not have a viable result
460 * string, returns 0, and sets `buffer` to the empty string (if possible).
461 * @returns
462 * Truncation has occurred if the return value is greater than or equal
463 * to `size`, similarly to the `snprintf`(3) function.
464 * You may safely pass NULL and 0 to `buffer` and `size` to find the
465 * required size (without the NUL-byte).
466 *
467 * @memberof xkb_compose_state
468 */
469int
470xkb_compose_state_get_utf8(struct xkb_compose_state *state,
471 char *buffer, size_t size);
472
473/**
474 * Get the result keysym for a composed sequence.
475 *
476 * See @ref compose-overview for more details. This function is only
477 * useful when xkb_compose_state_get_status() is XKB_COMPOSE_COMPOSED.
478 *
479 * @returns The result keysym. If the sequence is not complete, or does
480 * not specify a result keysym, returns XKB_KEY_NoSymbol.
481 *
482 * @memberof xkb_compose_state
483 */
484xkb_keysym_t
485xkb_compose_state_get_one_sym(struct xkb_compose_state *state);
486
487/** @} */
488
489#ifdef __cplusplus
490} /* extern "C" */
491#endif
492
493#endif /* _XKBCOMMON_COMPOSE_H */
494