1// © 2016 and later: Unicode, Inc. and others.
2// License & terms of use: http://www.unicode.org/copyright.html
3/*
4**********************************************************************
5* Copyright (C) 2000-2004, International Business Machines
6* Corporation and others. All Rights Reserved.
7**********************************************************************
8 * ucnv_cb.h:
9 * External APIs for the ICU's codeset conversion library
10 * Helena Shih
11 *
12 * Modification History:
13 *
14 * Date Name Description
15 */
16
/**
 * \file
 * \brief C UConverter functions to aid the writers of callbacks
 *
 * <h2> Callback API for UConverter </h2>
 *
 * These functions are provided here for the convenience of the callback
 * writer. If you are just looking for callback functions to use, please
 * see ucnv_err.h. DO NOT call these functions directly when you are
 * working with converters, unless your code has been called as a callback
 * via ucnv_setFromUCallback or ucnv_setToUCallback!
 *
 * A note about error codes and overflow: unlike other ICU functions,
 * these functions do not expect the error status to be U_ZERO_ERROR.
 * Callbacks must be much more careful about their error codes.
 * The error codes used here are in/out parameters, which should be passed
 * back in the callback's error parameter.
 *
 * For example, if you call ucnv_cbFromUWriteBytes to write data out
 * to the output codepage, it may return U_BUFFER_OVERFLOW_ERROR if
 * the data did not fit in the target. But this isn't a failing error;
 * in fact, ucnv_cbFromUWriteBytes may be called AGAIN with the error
 * status still U_BUFFER_OVERFLOW_ERROR to attempt to write further bytes,
 * which will also go into the internal overflow buffers.
 *
 * Concerning offsets, the 'offset' parameters here are relative to the start
 * of SOURCE. For example, suppose the string "ABCD" was being converted
 * from Unicode into a codepage which doesn't have a mapping for 'B'.
 * 'A' will be written out correctly, but
 * the FromU callback will be called on an unassigned character for 'B'.
 * At this point, this is the state of the world:
 *    Target:    A [..]     [points after A]
 *    Source:  A B [C] D    [points to C - B has been consumed]
 *             0 1  2  3
 *    codePoint = "B"       [the unassigned codepoint]
 *
 * Now, suppose a callback wants to write the substitution character '?' to
 * the target. It calls ucnv_cbFromUWriteBytes() to write the '?'.
 * It should pass ZERO as the offset, because the offset as far as the
 * callback is concerned is relative to the SOURCE pointer [which points
 * before 'C'.] If the callback goes into the args and consumes 'C' also,
 * it would call ucnv_cbFromUWriteBytes() with an offset of 1 (and advance
 * the source pointer).
 *
 */
62
63#ifndef UCNV_CB_H
64#define UCNV_CB_H
65
66#include "unicode/utypes.h"
67
68#if !UCONFIG_NO_CONVERSION
69
70#include "unicode/ucnv.h"
71#include "unicode/ucnv_err.h"
72
73/**
74 * ONLY used by FromU callback functions.
75 * Writes out the specified byte output bytes to the target byte buffer or to converter internal buffers.
76 *
77 * @param args callback fromUnicode arguments
78 * @param source source bytes to write
79 * @param length length of bytes to write
80 * @param offsetIndex the relative offset index from callback.
81 * @param err error status. If <TT>U_BUFFER_OVERFLOW</TT> is returned, then U_BUFFER_OVERFLOW <STRONG>must</STRONG>
82 * be returned to the user, because it means that not all data could be written into the target buffer, and some is
83 * in the converter error buffer.
84 * @see ucnv_cbFromUWriteSub
85 * @stable ICU 2.0
86 */
87U_STABLE void U_EXPORT2
88ucnv_cbFromUWriteBytes (UConverterFromUnicodeArgs *args,
89 const char* source,
90 int32_t length,
91 int32_t offsetIndex,
92 UErrorCode * err);
93
94/**
95 * ONLY used by FromU callback functions.
96 * This function will write out the correct substitution character sequence
97 * to the target.
98 *
99 * @param args callback fromUnicode arguments
100 * @param offsetIndex the relative offset index from the current source pointer to be used
101 * @param err error status. If <TT>U_BUFFER_OVERFLOW</TT> is returned, then U_BUFFER_OVERFLOW <STRONG>must</STRONG>
102 * be returned to the user, because it means that not all data could be written into the target buffer, and some is
103 * in the converter error buffer.
104 * @see ucnv_cbFromUWriteBytes
105 * @stable ICU 2.0
106 */
107U_STABLE void U_EXPORT2
108ucnv_cbFromUWriteSub (UConverterFromUnicodeArgs *args,
109 int32_t offsetIndex,
110 UErrorCode * err);
111
112/**
113 * ONLY used by fromU callback functions.
114 * This function will write out the error character(s) to the target UChar buffer.
115 *
116 * @param args callback fromUnicode arguments
117 * @param source pointer to pointer to first UChar to write [on exit: 1 after last UChar processed]
118 * @param sourceLimit pointer after last UChar to write
119 * @param offsetIndex the relative offset index from callback which will be set
120 * @param err error status <TT>U_BUFFER_OVERFLOW</TT>
121 * @see ucnv_cbToUWriteSub
122 * @stable ICU 2.0
123 */
124U_STABLE void U_EXPORT2 ucnv_cbFromUWriteUChars(UConverterFromUnicodeArgs *args,
125 const UChar** source,
126 const UChar* sourceLimit,
127 int32_t offsetIndex,
128 UErrorCode * err);
129
130/**
131 * ONLY used by ToU callback functions.
132 * This function will write out the specified characters to the target
133 * UChar buffer.
134 *
135 * @param args callback toUnicode arguments
136 * @param source source string to write
137 * @param length the length of source string
138 * @param offsetIndex the relative offset index which will be written.
139 * @param err error status <TT>U_BUFFER_OVERFLOW</TT>
140 * @see ucnv_cbToUWriteSub
141 * @stable ICU 2.0
142 */
143U_STABLE void U_EXPORT2 ucnv_cbToUWriteUChars (UConverterToUnicodeArgs *args,
144 const UChar* source,
145 int32_t length,
146 int32_t offsetIndex,
147 UErrorCode * err);
148
149/**
150 * ONLY used by ToU callback functions.
151 * This function will write out the Unicode substitution character (U+FFFD).
152 *
153 * @param args callback fromUnicode arguments
154 * @param offsetIndex the relative offset index from callback.
155 * @param err error status <TT>U_BUFFER_OVERFLOW</TT>
156 * @see ucnv_cbToUWriteUChars
157 * @stable ICU 2.0
158 */
159U_STABLE void U_EXPORT2 ucnv_cbToUWriteSub (UConverterToUnicodeArgs *args,
160 int32_t offsetIndex,
161 UErrorCode * err);
162#endif
163
164#endif
165