1 // © 2016 and later: Unicode, Inc. and others. 2 // License & terms of use: http://www.unicode.org/copyright.html 3 /* 4 ******************************************************************************* 5 * 6 * Copyright (C) 2003-2014, International Business Machines 7 * Corporation and others. All Rights Reserved. 8 * 9 ******************************************************************************* 10 * file name: usprep.h 11 * encoding: UTF-8 12 * tab size: 8 (not used) 13 * indentation:4 14 * 15 * created on: 2003jul2 16 * created by: Ram Viswanadha 17 */ 18 19 #ifndef __USPREP_H__ 20 #define __USPREP_H__ 21 22 /** 23 * \file 24 * \brief C API: Implements the StringPrep algorithm. 25 */ 26 27 #include "unicode/utypes.h" 28 #include "unicode/localpointer.h" 29 30 /** 31 * 32 * StringPrep API implements the StringPrep framework as described by RFC 3454. 33 * StringPrep prepares Unicode strings for use in network protocols. 34 * Profiles of StringPrep are sets of rules and data according to which the 35 * Unicode Strings are prepared. Each profile contains tables which describe 36 * how a code point should be treated. The tables are broadly classified into 37 * <ul> 38 * <li> Unassigned Table: Contains code points that are unassigned 39 * in the Unicode Version supported by StringPrep. Currently 40 * RFC 3454 supports Unicode 3.2. </li> 41 * <li> Prohibited Table: Contains code points that are prohibited from 42 * the output of the StringPrep processing function. </li> 43 * <li> Mapping Table: Contains code points that are deleted from the output or case mapped. </li> 44 * </ul> 45 * 46 * The procedure for preparing Unicode strings: 47 * <ol> 48 * <li> Map: For each character in the input, check if it has a mapping 49 * and, if so, replace it with its mapping. </li> 50 * <li> Normalize: Possibly normalize the result of step 1 using Unicode 51 * normalization. </li> 52 * <li> Prohibit: Check for any characters that are not allowed in the 53 * output. 
If any are found, return an error.</li> 54 * <li> Check bidi: Possibly check for right-to-left characters, and if 55 * any are found, make sure that the whole string satisfies the 56 * requirements for bidirectional strings. If the string does not 57 * satisfy the requirements for bidirectional strings, return an 58 * error. </li> 59 * </ol> 60 * @author Ram Viswanadha 61 */ 62 #if !UCONFIG_NO_IDNA 63 64 #include "unicode/parseerr.h" 65 66 /** 67 * The StringPrep profile. Declared here as an incomplete struct type; this header only refers to it through pointers. 68 * @stable ICU 2.8 69 */ 70 typedef struct UStringPrepProfile UStringPrepProfile; 71 72 73 /** 74 * Option to prohibit processing of unassigned code points in the input. Its value is 0x0000, i.e. no option bits set. 75 * 76 * @see usprep_prepare 77 * @stable ICU 2.8 78 */ 79 #define USPREP_DEFAULT 0x0000 80 81 /** 82 * Option to allow processing of unassigned code points in the input. Its value is the single bit 0x0001. 83 * 84 * @see usprep_prepare 85 * @stable ICU 2.8 86 */ 87 #define USPREP_ALLOW_UNASSIGNED 0x0001 88 89 /** 90 * Enum values for the standard StringPrep profile types 91 * supported by usprep_openByType. 
92 * @see usprep_openByType 93 * @stable ICU 4.2 94 */ 95 typedef enum UStringPrepProfileType { 96 /** 97 * RFC3491 Nameprep 98 * @stable ICU 4.2 99 */ 100 USPREP_RFC3491_NAMEPREP, 101 /** 102 * RFC3530 nfs4_cs_prep 103 * @stable ICU 4.2 104 */ 105 USPREP_RFC3530_NFS4_CS_PREP, 106 /** 107 * RFC3530 nfs4_cs_prep with case insensitive option 108 * @stable ICU 4.2 109 */ 110 USPREP_RFC3530_NFS4_CS_PREP_CI, 111 /** 112 * RFC3530 nfs4_cis_prep 113 * @stable ICU 4.2 114 */ 115 USPREP_RFC3530_NFS4_CIS_PREP, 116 /** 117 * RFC3530 nfs4_mixed_prep for prefix 118 * @stable ICU 4.2 119 */ 120 USPREP_RFC3530_NFS4_MIXED_PREP_PREFIX, 121 /** 122 * RFC3530 nfs4_mixed_prep for suffix 123 * @stable ICU 4.2 124 */ 125 USPREP_RFC3530_NFS4_MIXED_PREP_SUFFIX, 126 /** 127 * RFC3722 iSCSI 128 * @stable ICU 4.2 129 */ 130 USPREP_RFC3722_ISCSI, 131 /** 132 * RFC3920 XMPP Nodeprep 133 * @stable ICU 4.2 134 */ 135 USPREP_RFC3920_NODEPREP, 136 /** 137 * RFC3920 XMPP Resourceprep 138 * @stable ICU 4.2 139 */ 140 USPREP_RFC3920_RESOURCEPREP, 141 /** 142 * RFC4011 Policy MIB Stringprep 143 * @stable ICU 4.2 144 */ 145 USPREP_RFC4011_MIB, 146 /** 147 * RFC4013 SASLprep 148 * @stable ICU 4.2 149 */ 150 USPREP_RFC4013_SASLPREP, 151 /** 152 * RFC4505 trace 153 * @stable ICU 4.2 154 */ 155 USPREP_RFC4505_TRACE, 156 /** 157 * RFC4518 LDAP 158 * @stable ICU 4.2 159 */ 160 USPREP_RFC4518_LDAP, 161 /** 162 * RFC4518 LDAP for case ignore, numeric and stored prefix 163 * matching rules 164 * @stable ICU 4.2 165 */ 166 USPREP_RFC4518_LDAP_CI 167 } UStringPrepProfileType; 168 169 /** 170 * Creates a StringPrep profile from the data file. 171 * 172 * @param path string containing the full path pointing to the directory 173 * where the profile resides followed by the package name 174 * e.g. "/usr/resource/my_app/profiles/mydata" on a Unix system. 175 * If NULL, ICU default data files will be used. 176 * @param fileName name of the profile file to be opened 177 * @param status ICU error code in/out parameter. 
Must not be NULL. 178 * Must fulfill U_SUCCESS before the function call. 179 * @return Pointer to UStringPrepProfile that is opened. Should be closed by 180 * calling usprep_close() 181 * @see usprep_close() 182 * @stable ICU 2.8 183 */ 184 U_STABLE UStringPrepProfile* U_EXPORT2 185 usprep_open(const char* path, 186 const char* fileName, 187 UErrorCode* status); 188 189 /** 190 * Creates a StringPrep profile for the specified profile type. 191 * 192 * @param type The profile type, one of the UStringPrepProfileType values 193 * @param status ICU error code in/out parameter. Must not be NULL. 194 * Must fulfill U_SUCCESS before the function call. 195 * @return Pointer to UStringPrepProfile that is opened. Should be closed by 196 * calling usprep_close() 197 * @see usprep_close() 198 * @stable ICU 4.2 199 */ 200 U_STABLE UStringPrepProfile* U_EXPORT2 201 usprep_openByType(UStringPrepProfileType type, 202 UErrorCode* status); 203 204 /** 205 * Closes the profile. 206 * @param profile The profile to close 207 * @stable ICU 2.8 208 */ 209 U_STABLE void U_EXPORT2 210 usprep_close(UStringPrepProfile* profile); 211 212 #if U_SHOW_CPLUSPLUS_API 213 214 U_NAMESPACE_BEGIN 215 216 /** 217 * \class LocalUStringPrepProfilePointer 218 * "Smart pointer" class, closes a UStringPrepProfile via usprep_close(). 219 * For most methods see the LocalPointerBase base class. 220 * 221 * @see LocalPointerBase 222 * @see LocalPointer 223 * @stable ICU 4.4 224 */ 225 U_DEFINE_LOCAL_OPEN_POINTER(LocalUStringPrepProfilePointer, UStringPrepProfile, usprep_close); 226 227 U_NAMESPACE_END 228 229 #endif /* U_SHOW_CPLUSPLUS_API */ 230 231 /** 232 * Prepare the input buffer for use in applications with the given profile. This operation maps, normalizes (NFKC), 233 * and checks for prohibited and BiDi characters in the order defined by RFC 3454 234 * depending on the options specified in the profile. 
235 * 236 * @param prep The profile to use 237 * @param src Pointer to UChar buffer containing the string to prepare 238 * @param srcLength Number of characters in the source string 239 * @param dest Pointer to the destination buffer to receive the output 240 * @param destCapacity The capacity of the destination array 241 * @param options A bit set of options: 242 * 243 * - USPREP_DEFAULT Prohibit processing of unassigned code points in the input 244 * 245 * - USPREP_ALLOW_UNASSIGNED Treat unassigned code points in the input 246 * as normal Unicode code points. 247 * 248 * @param parseError Pointer to UParseError struct to receive information on position 249 * of error if an error is encountered. Can be NULL. 250 * @param status ICU in/out error code parameter. 251 * U_INVALID_CHAR_FOUND if src contains 252 * unmatched single surrogates. 253 * U_INDEX_OUTOFBOUNDS_ERROR if src contains 254 * too many code points. 255 * U_BUFFER_OVERFLOW_ERROR if destCapacity is not large enough 256 * @return The number of UChars in the destination buffer 257 * @stable ICU 2.8 258 */ 259 260 U_STABLE int32_t U_EXPORT2 261 usprep_prepare( const UStringPrepProfile* prep, 262 const UChar* src, int32_t srcLength, 263 UChar* dest, int32_t destCapacity, 264 int32_t options, 265 UParseError* parseError, 266 UErrorCode* status ); 267 268 269 #endif /* #if !UCONFIG_NO_IDNA */ 270 271 #endif /* __USPREP_H__ */ 272