1 | // © 2016 and later: Unicode, Inc. and others. |
2 | // License & terms of use: http://www.unicode.org/copyright.html |
3 | /* |
4 | ******************************************************************************* |
5 | * |
6 | * Copyright (C) 2003-2014, International Business Machines |
7 | * Corporation and others. All Rights Reserved. |
8 | * |
9 | ******************************************************************************* |
10 | * file name: usprep.h |
11 | * encoding: UTF-8 |
12 | * tab size: 8 (not used) |
13 | * indentation:4 |
14 | * |
15 | * created on: 2003jul2 |
16 | * created by: Ram Viswanadha |
17 | */ |
18 | |
19 | #ifndef __USPREP_H__ |
20 | #define __USPREP_H__ |
21 | |
22 | /** |
23 | * \file |
24 | * \brief C API: Implements the StringPrep algorithm. |
25 | */ |
26 | |
27 | #include "unicode/utypes.h" |
28 | #include "unicode/localpointer.h" |
29 | |
30 | /** |
31 | * |
32 | * StringPrep API implements the StringPrep framework as described by RFC 3454. |
33 | * StringPrep prepares Unicode strings for use in network protocols. |
34 | * Profiles of StringPrep are sets of rules and data according to which the |
35 | * Unicode strings are prepared. Each profile contains tables which describe |
36 | * how a code point should be treated. The tables are broadly classified into |
37 | * <ul> |
38 | * <li> Unassigned Table: Contains code points that are unassigned |
39 | * in the Unicode Version supported by StringPrep. Currently |
40 | * RFC 3454 supports Unicode 3.2. </li> |
41 | * <li> Prohibited Table: Contains code points that are prohibited from |
42 | * the output of the StringPrep processing function. </li> |
43 | * <li> Mapping Table: Contains code points that are deleted from the output or case mapped. </li> |
44 | * </ul> |
45 | * |
46 | * The procedure for preparing Unicode strings: |
47 | * <ol> |
48 | * <li> Map: For each character in the input, check if it has a mapping |
49 | * and, if so, replace it with its mapping. </li> |
50 | * <li> Normalize: Possibly normalize the result of step 1 using Unicode |
51 | * normalization. </li> |
52 | * <li> Prohibit: Check for any characters that are not allowed in the |
53 | * output. If any are found, return an error.</li> |
54 | * <li> Check bidi: Possibly check for right-to-left characters, and if |
55 | * any are found, make sure that the whole string satisfies the |
56 | * requirements for bidirectional strings. If the string does not |
57 | * satisfy the requirements for bidirectional strings, return an |
58 | * error. </li> |
59 | * </ol> |
60 | * @author Ram Viswanadha |
61 | */ |
62 | #if !UCONFIG_NO_IDNA |
63 | |
64 | #include "unicode/parseerr.h" |
65 | |
66 | /** |
67 | * The StringPrep profile: an incomplete struct type in this header, obtained from usprep_open() or usprep_openByType() and released with usprep_close(). |
68 | * @stable ICU 2.8 |
69 | */ |
70 | typedef struct UStringPrepProfile UStringPrepProfile; |
71 | |
72 | |
73 | /** |
74 | * Default option (no option bits set): prohibit processing of unassigned code points in the input. |
75 | * |
76 | * @see usprep_prepare |
77 | * @stable ICU 2.8 |
78 | */ |
79 | #define USPREP_DEFAULT 0x0000 |
80 | |
81 | /** |
82 | * Option bit to allow processing of unassigned code points in the input; passed in the options argument of usprep_prepare. |
83 | * |
84 | * @see usprep_prepare |
85 | * @stable ICU 2.8 |
86 | */ |
87 | #define USPREP_ALLOW_UNASSIGNED 0x0001 |
88 | |
89 | /** |
90 | * Enum constants for the standard StringPrep profile types |
91 | * supported by usprep_openByType. |
92 | * @see usprep_openByType |
93 | * @stable ICU 4.2 |
94 | */ |
95 | typedef enum UStringPrepProfileType { |
96 | /** |
97 | * RFC3491 Nameprep |
98 | * @stable ICU 4.2 |
99 | */ |
100 | USPREP_RFC3491_NAMEPREP, |
101 | /** |
102 | * RFC3530 nfs4_cs_prep |
103 | * @stable ICU 4.2 |
104 | */ |
105 | USPREP_RFC3530_NFS4_CS_PREP, |
106 | /** |
107 | * RFC3530 nfs4_cs_prep with case insensitive option |
108 | * @stable ICU 4.2 |
109 | */ |
110 | USPREP_RFC3530_NFS4_CS_PREP_CI, |
111 | /** |
112 | * RFC3530 nfs4_cis_prep |
113 | * @stable ICU 4.2 |
114 | */ |
115 | USPREP_RFC3530_NFS4_CIS_PREP, |
116 | /** |
117 | * RFC3530 nfs4_mixed_prep for prefix |
118 | * @stable ICU 4.2 |
119 | */ |
120 | USPREP_RFC3530_NFS4_MIXED_PREP_PREFIX, |
121 | /** |
122 | * RFC3530 nfs4_mixed_prep for suffix |
123 | * @stable ICU 4.2 |
124 | */ |
125 | USPREP_RFC3530_NFS4_MIXED_PREP_SUFFIX, |
126 | /** |
127 | * RFC3722 iSCSI |
128 | * @stable ICU 4.2 |
129 | */ |
130 | USPREP_RFC3722_ISCSI, |
131 | /** |
132 | * RFC3920 XMPP Nodeprep |
133 | * @stable ICU 4.2 |
134 | */ |
135 | USPREP_RFC3920_NODEPREP, |
136 | /** |
137 | * RFC3920 XMPP Resourceprep |
138 | * @stable ICU 4.2 |
139 | */ |
140 | USPREP_RFC3920_RESOURCEPREP, |
141 | /** |
142 | * RFC4011 Policy MIB Stringprep |
143 | * @stable ICU 4.2 |
144 | */ |
145 | USPREP_RFC4011_MIB, |
146 | /** |
147 | * RFC4013 SASLprep |
148 | * @stable ICU 4.2 |
149 | */ |
150 | USPREP_RFC4013_SASLPREP, |
151 | /** |
152 | * RFC4505 trace |
153 | * @stable ICU 4.2 |
154 | */ |
155 | USPREP_RFC4505_TRACE, |
156 | /** |
157 | * RFC4518 LDAP |
158 | * @stable ICU 4.2 |
159 | */ |
160 | USPREP_RFC4518_LDAP, |
161 | /** |
162 | * RFC4518 LDAP for case ignore, numeric and stored prefix |
163 | * matching rules |
164 | * @stable ICU 4.2 |
165 | */ |
166 | USPREP_RFC4518_LDAP_CI |
167 | } UStringPrepProfileType; |
168 | |
169 | /** |
170 | * Creates a StringPrep profile from the data file. |
171 | * |
172 | * @param path String containing the full path pointing to the directory |
173 | * where the profile resides, followed by the package name, |
174 | * e.g. "/usr/resource/my_app/profiles/mydata" on a Unix system. |
175 | * If NULL, ICU default data files will be used. |
176 | * @param fileName Name of the profile file to be opened |
177 | * @param status ICU error code in/out parameter. Must not be NULL. |
178 | * Must fulfill U_SUCCESS before the function call. |
179 | * @return Pointer to UStringPrepProfile that is opened. Should be closed by |
180 | * calling usprep_close() |
181 | * @see usprep_close() |
182 | * @stable ICU 2.8 |
183 | */ |
184 | U_STABLE UStringPrepProfile* U_EXPORT2 |
185 | usprep_open(const char* path, |
186 | const char* fileName, |
187 | UErrorCode* status); |
188 | |
189 | /** |
190 | * Creates a StringPrep profile for the specified profile type. |
191 | * |
192 | * @param type The standard profile type to open (a UStringPrepProfileType constant) |
193 | * @param status ICU error code in/out parameter. Must not be NULL. |
194 | * Must fulfill U_SUCCESS before the function call. |
195 | * @return Pointer to UStringPrepProfile that is opened. Should be closed by |
196 | * calling usprep_close() |
197 | * @see usprep_close() |
198 | * @stable ICU 4.2 |
199 | */ |
200 | U_STABLE UStringPrepProfile* U_EXPORT2 |
201 | usprep_openByType(UStringPrepProfileType type, |
202 | UErrorCode* status); |
203 | |
204 | /** |
205 | * Closes the profile. Profiles returned by usprep_open() or usprep_openByType() should be closed with this function. |
206 | * @param profile The profile to close |
207 | * @stable ICU 2.8 |
208 | */ |
209 | U_STABLE void U_EXPORT2 |
210 | usprep_close(UStringPrepProfile* profile); |
211 | |
212 | #if U_SHOW_CPLUSPLUS_API |
213 | |
214 | U_NAMESPACE_BEGIN |
215 | |
216 | /** |
217 | * \class LocalUStringPrepProfilePointer |
218 | * "Smart pointer" class, closes a UStringPrepProfile via usprep_close(). |
219 | * For most methods see the LocalPointerBase base class. |
220 | * |
221 | * @see LocalPointerBase |
222 | * @see LocalPointer |
223 | * @stable ICU 4.4 |
224 | */ |
225 | U_DEFINE_LOCAL_OPEN_POINTER(LocalUStringPrepProfilePointer, UStringPrepProfile, usprep_close); |
226 | |
227 | U_NAMESPACE_END |
228 | |
229 | #endif /* U_SHOW_CPLUSPLUS_API */ |
230 | |
231 | /** |
232 | * Prepare the input buffer for use in applications with the given profile. This operation maps, normalizes (NFKC), |
233 | * checks for prohibited and BiDi characters in the order defined by RFC 3454 |
234 | * depending on the options specified in the profile. |
235 | * |
236 | * @param prep The profile to use |
237 | * @param src Pointer to UChar buffer containing the string to prepare |
238 | * @param srcLength Number of characters in the source string |
239 | * @param dest Pointer to the destination buffer to receive the output |
240 | * @param destCapacity The capacity of destination array |
241 | * @param options A bit set of options: |
242 | * |
243 | * - USPREP_DEFAULT Prohibit processing of unassigned code points in the input |
244 | * |
245 | * - USPREP_ALLOW_UNASSIGNED Treat unassigned code points in the input |
246 | * as normal Unicode code points. |
247 | * |
248 | * @param parseError Pointer to UParseError struct to receive information on position |
249 | * of error if an error is encountered. Can be NULL. |
250 | * @param status ICU in/out error code parameter. |
251 | * U_INVALID_CHAR_FOUND if src contains |
252 | * unmatched single surrogates. |
253 | * U_INDEX_OUTOFBOUNDS_ERROR if src contains |
254 | * too many code points. |
255 | * U_BUFFER_OVERFLOW_ERROR if destCapacity is not enough |
256 | * @return The number of UChars in the destination buffer |
257 | * @stable ICU 2.8 |
258 | */ |
259 | |
260 | U_STABLE int32_t U_EXPORT2 |
261 | usprep_prepare( const UStringPrepProfile* prep, |
262 | const UChar* src, int32_t srcLength, |
263 | UChar* dest, int32_t destCapacity, |
264 | int32_t options, |
265 | UParseError* parseError, |
266 | UErrorCode* status ); |
267 | |
268 | |
269 | #endif /* #if !UCONFIG_NO_IDNA */ |
270 | |
271 | #endif /* __USPREP_H__ */ |
272 | |