1 /*
2 *******************************************************************************
3 *
4 * Copyright (C) 2003-2012, International Business Machines
5 * Corporation and others. All Rights Reserved.
6 *
7 *******************************************************************************
8 * file name: testidna.cpp
9 * encoding: US-ASCII
10 * tab size: 8 (not used)
11 * indentation:4
12 *
13 * created on: 2003feb1
14 * created by: Ram Viswanadha
15 */
16
17 #include "unicode/utypes.h"
18
19 #if !UCONFIG_NO_IDNA && !UCONFIG_NO_TRANSLITERATION
20
21 #include <time.h>
22 #include <limits.h>
23 #include <stdlib.h>
24 #include <string.h>
25 #include "unicode/localpointer.h"
26 #include "unicode/ustring.h"
27 #include "unicode/usprep.h"
28 #include "unicode/uniset.h"
29 #include "testidna.h"
30 #include "idnaref.h"
31 #include "nptrans.h"
32 #include "unicode/putil.h"
33 #include "idnaconf.h"
34
/*
 * Unicode (UTF-16) test labels.
 *
 * Entry i of this table is paired index-for-index with asciiIn[i]:
 * testToASCII() feeds unicodeIn[i] to the function under test and expects
 * asciiIn[i], and testToUnicode() runs the opposite direction. The two tables
 * must therefore stay the same length and in the same order.
 *
 * Every row holds at most 41 code units including the terminating 0x0000.
 * Rows that do not spell out 0x0000 are still NUL-terminated because the
 * unused tail of each 41-element row is zero-initialized. The longest row
 * fills all 41 slots exactly, so adding a longer label requires enlarging the
 * second dimension.
 */
static const UChar unicodeIn[][41] ={
    /* Arabic code points */
    {
        0x0644, 0x064A, 0x0647, 0x0645, 0x0627, 0x0628, 0x062A, 0x0643, 0x0644,
        0x0645, 0x0648, 0x0634, 0x0639, 0x0631, 0x0628, 0x064A, 0x061F, 0x0000
    },
    /* CJK ideographs */
    {
        0x4ED6, 0x4EEC, 0x4E3A, 0x4EC0, 0x4E48, 0x4E0D, 0x8BF4, 0x4E2D, 0x6587,
        0x0000
    },
    /* Latin letters with diacritics */
    {
        0x0050, 0x0072, 0x006F, 0x010D, 0x0070, 0x0072, 0x006F, 0x0073, 0x0074,
        0x011B, 0x006E, 0x0065, 0x006D, 0x006C, 0x0075, 0x0076, 0x00ED, 0x010D,
        0x0065, 0x0073, 0x006B, 0x0079, 0x0000
    },
    /* Hebrew code points */
    {
        0x05DC, 0x05DE, 0x05D4, 0x05D4, 0x05DD, 0x05E4, 0x05E9, 0x05D5, 0x05D8,
        0x05DC, 0x05D0, 0x05DE, 0x05D3, 0x05D1, 0x05E8, 0x05D9, 0x05DD, 0x05E2,
        0x05D1, 0x05E8, 0x05D9, 0x05EA, 0x0000
    },
    /* Devanagari code points */
    {
        0x092F, 0x0939, 0x0932, 0x094B, 0x0917, 0x0939, 0x093F, 0x0928, 0x094D,
        0x0926, 0x0940, 0x0915, 0x094D, 0x092F, 0x094B, 0x0902, 0x0928, 0x0939,
        0x0940, 0x0902, 0x092C, 0x094B, 0x0932, 0x0938, 0x0915, 0x0924, 0x0947,
        0x0939, 0x0948, 0x0902, 0x0000
    },
    /* Hiragana mixed with CJK ideographs */
    {
        0x306A, 0x305C, 0x307F, 0x3093, 0x306A, 0x65E5, 0x672C, 0x8A9E, 0x3092,
        0x8A71, 0x3057, 0x3066, 0x304F, 0x308C, 0x306A, 0x3044, 0x306E, 0x304B,
        0x0000
    },
    /* Disabled Hangul entry; its counterpart in asciiIn is commented out as well.
    {
        0xC138, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
        0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
        0xC5BC, 0xB9C8, 0xB098, 0xC88B, 0xC744, 0xAE4C, 0x0000
    },
    */
    /* Cyrillic code points */
    {
        0x043F, 0x043E, 0x0447, 0x0435, 0x043C, 0x0443, 0x0436, 0x0435, 0x043E,
        0x043D, 0x0438, 0x043D, 0x0435, 0x0433, 0x043E, 0x0432, 0x043E, 0x0440,
        0x044F, 0x0442, 0x043F, 0x043E, 0x0440, 0x0443, 0x0441, 0x0441, 0x043A,
        0x0438, 0x0000
    },
    /* Latin letters with diacritics; this row uses all 41 code units */
    {
        0x0050, 0x006F, 0x0072, 0x0071, 0x0075, 0x00E9, 0x006E, 0x006F, 0x0070,
        0x0075, 0x0065, 0x0064, 0x0065, 0x006E, 0x0073, 0x0069, 0x006D, 0x0070,
        0x006C, 0x0065, 0x006D, 0x0065, 0x006E, 0x0074, 0x0065, 0x0068, 0x0061,
        0x0062, 0x006C, 0x0061, 0x0072, 0x0065, 0x006E, 0x0045, 0x0073, 0x0070,
        0x0061, 0x00F1, 0x006F, 0x006C, 0x0000
    },
    /* CJK ideographs */
    {
        0x4ED6, 0x5011, 0x7232, 0x4EC0, 0x9EBD, 0x4E0D, 0x8AAA, 0x4E2D, 0x6587,
        0x0000
    },
    /* Latin letters with diacritics */
    {
        0x0054, 0x1EA1, 0x0069, 0x0073, 0x0061, 0x006F, 0x0068, 0x1ECD, 0x006B,
        0x0068, 0x00F4, 0x006E, 0x0067, 0x0074, 0x0068, 0x1EC3, 0x0063, 0x0068,
        0x1EC9, 0x006E, 0x00F3, 0x0069, 0x0074, 0x0069, 0x1EBF, 0x006E, 0x0067,
        0x0056, 0x0069, 0x1EC7, 0x0074, 0x0000
    },
    /* The following rows mix ASCII with CJK ideographs, Hiragana or Katakana */
    {
        0x0033, 0x5E74, 0x0042, 0x7D44, 0x91D1, 0x516B, 0x5148, 0x751F, 0x0000
    },
    {
        0x5B89, 0x5BA4, 0x5948, 0x7F8E, 0x6075, 0x002D, 0x0077, 0x0069, 0x0074,
        0x0068, 0x002D, 0x0053, 0x0055, 0x0050, 0x0045, 0x0052, 0x002D, 0x004D,
        0x004F, 0x004E, 0x004B, 0x0045, 0x0059, 0x0053, 0x0000
    },
    {
        0x0048, 0x0065, 0x006C, 0x006C, 0x006F, 0x002D, 0x0041, 0x006E, 0x006F,
        0x0074, 0x0068, 0x0065, 0x0072, 0x002D, 0x0057, 0x0061, 0x0079, 0x002D,
        0x305D, 0x308C, 0x305E, 0x308C, 0x306E, 0x5834, 0x6240, 0x0000
    },
    {
        0x3072, 0x3068, 0x3064, 0x5C4B, 0x6839, 0x306E, 0x4E0B, 0x0032, 0x0000
    },
    {
        0x004D, 0x0061, 0x006A, 0x0069, 0x3067, 0x004B, 0x006F, 0x0069, 0x3059,
        0x308B, 0x0035, 0x79D2, 0x524D, 0x0000
    },
    {
        0x30D1, 0x30D5, 0x30A3, 0x30FC, 0x0064, 0x0065, 0x30EB, 0x30F3, 0x30D0,
        0x0000
    },
    {
        0x305D, 0x306E, 0x30B9, 0x30D4, 0x30FC, 0x30C9, 0x3067, 0x0000
    },
    // test non-BMP code points (each code point is a surrogate pair)
    {
        0xD800, 0xDF00, 0xD800, 0xDF01, 0xD800, 0xDF02, 0xD800, 0xDF03, 0xD800, 0xDF05,
        0xD800, 0xDF06, 0xD800, 0xDF07, 0xD800, 0xDF09, 0xD800, 0xDF0A, 0xD800, 0xDF0B,
        0x0000
    },
    {
        0xD800, 0xDF0D, 0xD800, 0xDF0C, 0xD800, 0xDF1E, 0xD800, 0xDF0F, 0xD800, 0xDF16,
        0xD800, 0xDF15, 0xD800, 0xDF14, 0xD800, 0xDF12, 0xD800, 0xDF10, 0xD800, 0xDF20,
        0xD800, 0xDF21,
        0x0000
    },
    // Greek (terminated by the zero-filled remainder of the row)
    {
        0x03b5, 0x03bb, 0x03bb, 0x03b7, 0x03bd, 0x03b9, 0x03ba, 0x03ac
    },
    // Maltese (terminated by the zero-filled remainder of the row)
    {
        0x0062, 0x006f, 0x006e, 0x0121, 0x0075, 0x0073, 0x0061, 0x0127,
        0x0127, 0x0061
    },
    // Russian (terminated by the zero-filled remainder of the row)
    {
        0x043f, 0x043e, 0x0447, 0x0435, 0x043c, 0x0443, 0x0436, 0x0435,
        0x043e, 0x043d, 0x0438, 0x043d, 0x0435, 0x0433, 0x043e, 0x0432,
        0x043e, 0x0440, 0x044f, 0x0442, 0x043f, 0x043e, 0x0440, 0x0443,
        0x0441, 0x0441, 0x043a, 0x0438
    },
    // U+FB00 and U+FB01; the paired asciiIn entry is the plain ASCII "fffi"
    {
        0xFB00, 0xFB01
    }

};
155
/*
 * ASCII forms of the labels in unicodeIn, in the same order: asciiIn[i] is the
 * expected ToASCII result for unicodeIn[i] and the ToUnicode input that is
 * expected to produce unicodeIn[i]. The tests index both tables with the same
 * loop counter, so the two tables must have the same number of entries.
 *
 * The entries deliberately vary in letter case; testAPI() compares results
 * with u_strCaseCompare(), so case differences do not cause failures.
 */
static const char *asciiIn[] = {
    "xn--egbpdaj6bu4bxfgehfvwxn",
    "xn--ihqwcrb4cv8a8dqg056pqjye",
    "xn--Proprostnemluvesky-uyb24dma41a",
    "xn--4dbcagdahymbxekheh6e0a7fei0b",
    "xn--i1baa7eci9glrd9b2ae1bj0hfcgg6iyaf8o0a1dig0cd",
    "xn--n8jok5ay5dzabd5bym9f0cm5685rrjetr6pdxa",
    /* Disabled together with the commented-out Hangul row of unicodeIn: */
/*  "xn--989aomsvi5e83db1d2a355cv1e0vak1dwrv93d5xbh15a0dt30a5jpsd879ccm6fea98c",*/
    "xn--b1abfaaepdrnnbgefbaDotcwatmq2g4l",
    "xn--PorqunopuedensimplementehablarenEspaol-fmd56a",
    "xn--ihqwctvzc91f659drss3x8bo0yb",
    "xn--TisaohkhngthchnitingVit-kjcr8268qyxafd2f1b9g",
    "xn--3B-ww4c5e180e575a65lsy2b",
    "xn---with-SUPER-MONKEYS-pc58ag80a8qai00g7n9n",
    "xn--Hello-Another-Way--fc4qua05auwb3674vfr0b",
    "xn--2-u9tlzr9756bt3uc0v",
    "xn--MajiKoi5-783gue6qz075azm5e",
    "xn--de-jg4avhby1noc0d",
    "xn--d9juau41awczczp",
    "XN--097CCDEKGHQJK",
    "XN--db8CBHEJLGH4E0AL",
    "xn--hxargifdar", // Greek
    "xn--bonusaa-5bb1da", // Maltese
    "xn--b1abfaaepdrnnbgefbadotcwatmq2g4l", // Russian (Cyrillic)
    "fffi"  // plain ASCII counterpart of the U+FB00 U+FB01 row
};
182
/*
 * Multi-label domain names used by testIDNToUnicode() and testIDNToASCII().
 *
 * Each string is passed through u_unescape() before use, which is why the
 * non-ASCII entries are written with a doubled backslash ("\\uXXXX"): the C++
 * literal contains the characters "\uXXXX", and u_unescape() turns them into
 * the actual code unit at run time.
 *
 * The commented-out entries are kept as a record of inputs that fail with the
 * error named in the adjacent comment.
 */
static const char *domainNames[] = {
    "slip129-37-118-146.nc.us.ibm.net",
    "saratoga.pe.utexas.edu",
    "dial-120-45.ots.utexas.edu",
    "woo-085.dorms.waller.net",
    "hd30-049.hil.compuserve.com",
    "pem203-31.pe.ttu.edu",
    "56K-227.MaxTNT3.pdq.net",
    "dial-36-2.ots.utexas.edu",
    "slip129-37-23-152.ga.us.ibm.net",
    "ts45ip119.cadvision.com",
    "sdn-ts-004txaustP05.dialsprint.net",
    "bar-tnt1s66.erols.com",
    "101.st-louis-15.mo.dial-access.att.net",
    "h92-245.Arco.COM",
    "dial-13-2.ots.utexas.edu",
    "net-redynet29.datamarkets.com.ar",
    "ccs-shiva28.reacciun.net.ve",
    "7.houston-11.tx.dial-access.att.net",
    "ingw129-37-120-26.mo.us.ibm.net",
    "dialup6.austintx.com",
    "dns2.tpao.gov.tr",
    "slip129-37-119-194.nc.us.ibm.net",
    "cs7.dillons.co.uk.203.119.193.in-addr.arpa",
    "swprd1.innovplace.saskatoon.sk.ca",
    "bikini.bologna.maraut.it",
    "node91.subnet159-198-79.baxter.com",
    "cust19.max5.new-york.ny.ms.uu.net",
    "balexander.slip.andrew.cmu.edu",
    "pool029.max2.denver.co.dynip.alter.net",
    "cust49.max9.new-york.ny.ms.uu.net",
    "s61.abq-dialin2.hollyberry.com",
    "\\u0917\\u0928\\u0947\\u0936.sanjose.ibm.com", //':'(0x003a) produces U_IDNA_STD3_ASCII_RULES_ERROR
    "www.xn--vea.com",
    // "www.\\u00E0\\u00B3\\u00AF.com",//' ' (0x0020) produces U_IDNA_STD3_ASCII_RULES_ERROR
    "www.\\u00C2\\u00A4.com",
    "www.\\u00C2\\u00A3.com",
    // "\\u0025", //'%' (0x0025) produces U_IDNA_STD3_ASCII_RULES_ERROR
    // "\\u005C\\u005C", //'\' (0x005C) produces U_IDNA_STD3_ASCII_RULES_ERROR
    //"@",
    //"\\u002F",
    //"www.\\u0021.com",
    //"www.\\u0024.com",
    //"\\u003f",
    // These yield U_IDNA_PROHIBITED_ERROR
    //"\\u00CF\\u0082.com",
    //"\\u00CE\\u00B2\\u00C3\\u009Fss.com",
    //"\\u00E2\\u0098\\u00BA.com",
    "\\u00C3\\u00BC.com",

};
234
typedef struct ErrorCases ErrorCases;

/*
 * Table of inputs that are expected to make the IDNA functions fail with a
 * specific error code. It is consumed by testErrorCases().
 */
static const struct ErrorCases{

    /* NUL-terminated UTF-16 domain name used as the IDNToASCII source.
       If the first code unit is 0, testErrorCases() passes a NULL source. */
    UChar unicode[100];
    /* ASCII form of the name: the expected IDNToASCII output and, when
       testToUnicode is set, the IDNToUnicode source. May be NULL. */
    const char *ascii;
    /* Error code the function under test is expected to report. */
    UErrorCode expected;
    /* Passed to testAPI() to select UIDNA_USE_STD3_RULES as the base option. */
    UBool useSTD3ASCIIRules;
    /* TRUE: also run the IDNToUnicode function on this case. */
    UBool testToUnicode;
    /* TRUE: run the IDNToASCII check a second time with output comparison disabled. */
    UBool testLabel;
} errorCases[] = {
    {

        {
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            0xC138, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
            0x070F,/*prohibited*/
            0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000
        },
        "www.XN--8mb5595fsoa28orucya378bqre2tcwop06c5qbw82a1rffmae0361dea96b.com",
        U_IDNA_PROHIBITED_ERROR,
        FALSE, FALSE, TRUE
    },

    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            0xC138, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
            0x0221, 0x0234/*Unassigned code points*/,
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000
        },
        "www.XN--6lA2Bz548Fj1GuA391Bf1Gb1N59Ab29A7iA.com",

        U_IDNA_UNASSIGNED_ERROR,
        FALSE, FALSE, TRUE
    },
    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            0xC138, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
            0x0644, 0x064A, 0x0647,/*Arabic code points. Cannot mix RTL with LTR*/
            0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000
        },
        "www.xn--ghBGI4851OiyA33VqrD6Az86C4qF83CtRv93D5xBk15AzfG0nAgA0578DeA71C.com",
        U_IDNA_CHECK_BIDI_ERROR,
        FALSE, FALSE, TRUE
    },
    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            /* labels cannot begin with a HYPHEN */
            0x002D, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
            0x002E,
            0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000

        },
        "www.xn----b95Ew8SqA315Ao5FbuMlnNmhA.com",
        U_IDNA_STD3_ASCII_RULES_ERROR,
        TRUE, FALSE, FALSE
    },
    {
        {
            /* correct ACE-prefix followed by unicode */
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            0x0078, 0x006e, 0x002d,0x002d, /* ACE Prefix */
            0x002D, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
            0x002D,
            0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000

        },
        /* wrong ACE-prefix followed by valid ACE-encoded ASCII */
        "www.XY-----b91I0V65S96C2A355Cw1E5yCeQr19CsnP1mFfmAE0361DeA96B.com",
        U_IDNA_ACE_PREFIX_ERROR,
        FALSE, FALSE, FALSE
    },
    /* cannot verify U_IDNA_VERIFICATION_ERROR */

    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            0xC138, 0xACC4, 0xC758, 0xBAA8, 0xB4E0, 0xC0AC, 0xB78C, 0xB4E4, 0xC774,
            0xD55C, 0xAD6D, 0xC5B4, 0xB97C, 0xC774, 0xD574, 0xD55C, 0xB2E4, 0xBA74,
            0xC5BC, 0xB9C8, 0xB098, 0xC88B, 0xC744, 0xAE4C,
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000
        },
        "www.xn--989AoMsVi5E83Db1D2A355Cv1E0vAk1DwRv93D5xBh15A0Dt30A5JpSD879Ccm6FeA98C.com",
        U_IDNA_LABEL_TOO_LONG_ERROR,
        FALSE, FALSE, TRUE
    },

    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, /* www. */
            0x0030, 0x0644, 0x064A, 0x0647, 0x0031, /* Arabic code points squashed between EN codepoints */
            0x002e, 0x0063, 0x006f, 0x006d, /* com. */
            0x0000
        },
        "www.xn--01-tvdmo.com",
        U_IDNA_CHECK_BIDI_ERROR,
        FALSE, FALSE, TRUE
    },

    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, // www.
            0x206C, 0x0644, 0x064A, 0x0647, 0x206D, // Arabic code points squashed between BN codepoints
            0x002e, 0x0063, 0x006f, 0x006d, // com.
            0x0000
        },
        "www.XN--ghbgi278xia.com",
        U_IDNA_PROHIBITED_ERROR,
        FALSE, FALSE, TRUE
    },
    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, // www.
            0x002D, 0x0041, 0x0042, 0x0043, 0x0044, 0x0045, // HYPHEN at the start of label
            0x002e, 0x0063, 0x006f, 0x006d, // com.
            0x0000
        },
        "www.-abcde.com",
        U_IDNA_STD3_ASCII_RULES_ERROR,
        TRUE, FALSE, FALSE
    },
    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, // www.
            0x0041, 0x0042, 0x0043, 0x0044, 0x0045,0x002D, // HYPHEN at the end of the label
            0x002e, 0x0063, 0x006f, 0x006d, // com.
            0x0000
        },
        "www.abcde-.com",
        U_IDNA_STD3_ASCII_RULES_ERROR,
        TRUE, FALSE, FALSE
    },
    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, // www.
            0x0041, 0x0042, 0x0043, 0x0044, 0x0045,0x0040, // Containing non LDH code point
            0x002e, 0x0063, 0x006f, 0x006d, // com.
            0x0000
        },
        "www.abcde@.com",
        U_IDNA_STD3_ASCII_RULES_ERROR,
        TRUE, FALSE, FALSE
    },
    {
        {
            0x0077, 0x0077, 0x0077, 0x002e, // www.
            // zero length label
            0x002e, 0x0063, 0x006f, 0x006d, // com.
            0x0000
        },
        "www..com",
        U_IDNA_ZERO_LENGTH_LABEL_ERROR,
        TRUE, FALSE, FALSE
    },
    /* Empty unicode array and NULL ascii: testErrorCases() turns this into a
       NULL source, for which U_ILLEGAL_ARGUMENT_ERROR is expected. */
    {
        {0},
        NULL,
        U_ILLEGAL_ARGUMENT_ERROR,
        TRUE, TRUE, FALSE
    }
};
409
410
411
412
/* Capacity, in UChars, of the fixed-size stack buffers used by the tests in this file. */
#define MAX_DEST_SIZE 300
414
debug(const UChar * src,int32_t srcLength,int32_t options)415 void TestIDNA::debug(const UChar* src, int32_t srcLength, int32_t options){
416 UParseError parseError;
417 UErrorCode transStatus = U_ZERO_ERROR;
418 UErrorCode prepStatus = U_ZERO_ERROR;
419 NamePrepTransform* trans = NamePrepTransform::createInstance(parseError,transStatus);
420 int32_t prepOptions = (((options & UIDNA_ALLOW_UNASSIGNED) != 0) ? USPREP_ALLOW_UNASSIGNED: 0);
421 LocalUStringPrepProfilePointer prep(usprep_openByType(USPREP_RFC3491_NAMEPREP,&prepStatus));
422 UChar *transOut=NULL, *prepOut=NULL;
423 int32_t transOutLength=0, prepOutLength=0;
424
425
426 transOutLength = trans->process(src,srcLength,transOut, 0, prepOptions>0, &parseError, transStatus);
427 if( transStatus == U_BUFFER_OVERFLOW_ERROR){
428 transStatus = U_ZERO_ERROR;
429 transOut = (UChar*) malloc(U_SIZEOF_UCHAR * transOutLength);
430 transOutLength = trans->process(src,srcLength,transOut, transOutLength, prepOptions>0, &parseError, transStatus);
431 }
432
433 prepOutLength = usprep_prepare(prep.getAlias(), src, srcLength, prepOut, 0, prepOptions, &parseError, &prepStatus);
434
435 if( prepStatus == U_BUFFER_OVERFLOW_ERROR){
436 prepStatus = U_ZERO_ERROR;
437 prepOut = (UChar*) malloc(U_SIZEOF_UCHAR * prepOutLength);
438 prepOutLength = usprep_prepare(prep.getAlias(), src, srcLength, prepOut, prepOutLength, prepOptions, &parseError, &prepStatus);
439 }
440
441 if(UnicodeString(transOut,transOutLength)!= UnicodeString(prepOut, prepOutLength)){
442 errln("Failed. Expected: " + prettify(UnicodeString(transOut, transOutLength))
443 + " Got: " + prettify(UnicodeString(prepOut,prepOutLength)));
444 }
445 free(transOut);
446 free(prepOut);
447 delete trans;
448 }
449
testAPI(const UChar * src,const UChar * expected,const char * testName,UBool useSTD3ASCIIRules,UErrorCode expectedStatus,UBool doCompare,UBool testUnassigned,TestFunc func,UBool testSTD3ASCIIRules)450 void TestIDNA::testAPI(const UChar* src, const UChar* expected, const char* testName,
451 UBool useSTD3ASCIIRules,UErrorCode expectedStatus,
452 UBool doCompare, UBool testUnassigned, TestFunc func, UBool testSTD3ASCIIRules){
453
454 UErrorCode status = U_ZERO_ERROR;
455 UChar destStack[MAX_DEST_SIZE];
456 int32_t destLen = 0;
457 UChar* dest = NULL;
458 int32_t expectedLen = (expected != NULL) ? u_strlen(expected) : 0;
459 int32_t options = (useSTD3ASCIIRules == TRUE) ? UIDNA_USE_STD3_RULES : UIDNA_DEFAULT;
460 UParseError parseError;
461 int32_t tSrcLen = 0;
462 UChar* tSrc = NULL;
463
464 if(src != NULL){
465 tSrcLen = u_strlen(src);
466 tSrc =(UChar*) malloc( U_SIZEOF_UCHAR * tSrcLen );
467 memcpy(tSrc,src,tSrcLen * U_SIZEOF_UCHAR);
468 }
469
470 // test null-terminated source and return value of number of UChars required
471 destLen = func(src,-1,NULL,0,options, &parseError , &status);
472 if(status == U_BUFFER_OVERFLOW_ERROR){
473 status = U_ZERO_ERROR; // reset error code
474 if(destLen+1 < MAX_DEST_SIZE){
475 dest = destStack;
476 destLen = func(src,-1,dest,destLen+1,options, &parseError, &status);
477 // TODO : compare output with expected
478 if(U_SUCCESS(status) && expectedStatus != U_IDNA_STD3_ASCII_RULES_ERROR&& (doCompare==TRUE) && u_strCaseCompare(dest,destLen, expected,expectedLen,0,&status)!=0){
479 errln("Did not get the expected result for "+UnicodeString(testName) +" null terminated source. Expected : "
480 + prettify(UnicodeString(expected,expectedLen))
481 + " Got: " + prettify(UnicodeString(dest,destLen))
482 );
483 }
484 }else{
485 errln( "%s null terminated source failed. Requires destCapacity > 300\n",testName);
486 }
487 }
488
489 if(status != expectedStatus){
490 errcheckln(status, "Did not get the expected error for "+
491 UnicodeString(testName)+
492 " null terminated source. Expected: " +UnicodeString(u_errorName(expectedStatus))
493 + " Got: "+ UnicodeString(u_errorName(status))
494 + " Source: " + prettify(UnicodeString(src))
495 );
496 free(tSrc);
497 return;
498 }
499 if(testUnassigned ){
500 status = U_ZERO_ERROR;
501 destLen = func(src,-1,NULL,0,options | UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
502 if(status == U_BUFFER_OVERFLOW_ERROR){
503 status = U_ZERO_ERROR; // reset error code
504 if(destLen+1 < MAX_DEST_SIZE){
505 dest = destStack;
506 destLen = func(src,-1,dest,destLen+1,options | UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
507 // TODO : compare output with expected
508 if(U_SUCCESS(status) && (doCompare==TRUE) && u_strCaseCompare(dest,destLen, expected,expectedLen,0,&status)!=0){
509 //errln("Did not get the expected result for %s null terminated source with both options set.\n",testName);
510 errln("Did not get the expected result for "+UnicodeString(testName) +
511 " null terminated source "+ prettify(src) +
512 " with both options set. Expected: "+ prettify(UnicodeString(expected,expectedLen))+
513 "Got: " + prettify(UnicodeString(dest,destLen)));
514
515 debug(src,-1,options | UIDNA_ALLOW_UNASSIGNED);
516
517 }
518 }else{
519 errln( "%s null terminated source failed. Requires destCapacity > 300\n",testName);
520 }
521 }
522 //testing query string
523 if(status != expectedStatus && expectedStatus != U_IDNA_UNASSIGNED_ERROR){
524 errln( "Did not get the expected error for "+
525 UnicodeString(testName)+
526 " null terminated source with options set. Expected: " +UnicodeString(u_errorName(expectedStatus))
527 + " Got: "+ UnicodeString(u_errorName(status))
528 + " Source: " + prettify(UnicodeString(src))
529 );
530 }
531 }
532
533 status = U_ZERO_ERROR;
534
535 // test source with lengthand return value of number of UChars required
536 destLen = func(tSrc, tSrcLen, NULL,0,options, &parseError, &status);
537 if(status == U_BUFFER_OVERFLOW_ERROR){
538 status = U_ZERO_ERROR; // reset error code
539 if(destLen+1 < MAX_DEST_SIZE){
540 dest = destStack;
541 destLen = func(src,u_strlen(src),dest,destLen+1,options, &parseError, &status);
542 // TODO : compare output with expected
543 if(U_SUCCESS(status) && (doCompare==TRUE) && u_strCaseCompare(dest,destLen, expected,expectedLen,0,&status)!=0){
544 errln("Did not get the expected result for %s with source length.\n",testName);
545 }
546 }else{
547 errln( "%s with source length failed. Requires destCapacity > 300\n",testName);
548 }
549 }
550
551 if(status != expectedStatus){
552 errln( "Did not get the expected error for "+
553 UnicodeString(testName)+
554 " with source length. Expected: " +UnicodeString(u_errorName(expectedStatus))
555 + " Got: "+ UnicodeString(u_errorName(status))
556 + " Source: " + prettify(UnicodeString(src))
557 );
558 }
559 if(testUnassigned){
560 status = U_ZERO_ERROR;
561
562 destLen = func(tSrc,tSrcLen,NULL,0,options | UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
563
564 if(status == U_BUFFER_OVERFLOW_ERROR){
565 status = U_ZERO_ERROR; // reset error code
566 if(destLen+1 < MAX_DEST_SIZE){
567 dest = destStack;
568 destLen = func(src,u_strlen(src),dest,destLen+1,options | UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
569 // TODO : compare output with expected
570 if(U_SUCCESS(status) && (doCompare==TRUE) && u_strCaseCompare(dest,destLen, expected,expectedLen,0,&status)!=0){
571 errln("Did not get the expected result for %s with source length and both options set.\n",testName);
572 }
573 }else{
574 errln( "%s with source length failed. Requires destCapacity > 300\n",testName);
575 }
576 }
577 //testing query string
578 if(status != expectedStatus && expectedStatus != U_IDNA_UNASSIGNED_ERROR){
579 errln( "Did not get the expected error for "+
580 UnicodeString(testName)+
581 " with source length and options set. Expected: " +UnicodeString(u_errorName(expectedStatus))
582 + " Got: "+ UnicodeString(u_errorName(status))
583 + " Source: " + prettify(UnicodeString(src))
584 );
585 }
586 }
587
588 status = U_ZERO_ERROR;
589 if(testSTD3ASCIIRules==TRUE){
590 destLen = func(src,-1,NULL,0,options | UIDNA_USE_STD3_RULES, &parseError, &status);
591 if(status == U_BUFFER_OVERFLOW_ERROR){
592 status = U_ZERO_ERROR; // reset error code
593 if(destLen+1 < MAX_DEST_SIZE){
594 dest = destStack;
595 destLen = func(src,-1,dest,destLen+1,options | UIDNA_USE_STD3_RULES, &parseError, &status);
596 // TODO : compare output with expected
597 if(U_SUCCESS(status) && (doCompare==TRUE) && u_strCaseCompare(dest,destLen, expected,expectedLen,0,&status)!=0){
598 //errln("Did not get the expected result for %s null terminated source with both options set.\n",testName);
599 errln("Did not get the expected result for "+UnicodeString(testName) +" null terminated source with both options set. Expected: "+ prettify(UnicodeString(expected,expectedLen)));
600
601 }
602 }else{
603 errln( "%s null terminated source failed. Requires destCapacity > 300\n",testName);
604 }
605 }
606 //testing query string
607 if(status != expectedStatus){
608 errln( "Did not get the expected error for "+
609 UnicodeString(testName)+
610 " null terminated source with options set. Expected: " +UnicodeString(u_errorName(expectedStatus))
611 + " Got: "+ UnicodeString(u_errorName(status))
612 + " Source: " + prettify(UnicodeString(src))
613 );
614 }
615
616 status = U_ZERO_ERROR;
617
618 destLen = func(tSrc,tSrcLen,NULL,0,options | UIDNA_USE_STD3_RULES, &parseError, &status);
619
620 if(status == U_BUFFER_OVERFLOW_ERROR){
621 status = U_ZERO_ERROR; // reset error code
622 if(destLen+1 < MAX_DEST_SIZE){
623 dest = destStack;
624 destLen = func(src,u_strlen(src),dest,destLen+1,options | UIDNA_USE_STD3_RULES, &parseError, &status);
625 // TODO : compare output with expected
626 if(U_SUCCESS(status) && (doCompare==TRUE) && u_strCaseCompare(dest,destLen, expected,expectedLen,0,&status)!=0){
627 errln("Did not get the expected result for %s with source length and both options set.\n",testName);
628 }
629 }else{
630 errln( "%s with source length failed. Requires destCapacity > 300\n",testName);
631 }
632 }
633 //testing query string
634 if(status != expectedStatus && expectedStatus != U_IDNA_UNASSIGNED_ERROR){
635 errln( "Did not get the expected error for "+
636 UnicodeString(testName)+
637 " with source length and options set. Expected: " +UnicodeString(u_errorName(expectedStatus))
638 + " Got: "+ UnicodeString(u_errorName(status))
639 + " Source: " + prettify(UnicodeString(src))
640 );
641 }
642 }
643 free(tSrc);
644 }
645
testCompare(const UChar * s1,int32_t s1Len,const UChar * s2,int32_t s2Len,const char * testName,CompareFunc func,UBool isEqual)646 void TestIDNA::testCompare(const UChar* s1, int32_t s1Len,
647 const UChar* s2, int32_t s2Len,
648 const char* testName, CompareFunc func,
649 UBool isEqual){
650
651 UErrorCode status = U_ZERO_ERROR;
652 int32_t retVal = func(s1,-1,s2,-1,UIDNA_DEFAULT,&status);
653
654 if(isEqual==TRUE && retVal !=0){
655 errln("Did not get the expected result for %s with null termniated strings.\n",testName);
656 }
657 if(U_FAILURE(status)){
658 errcheckln(status, "%s null terminated source failed. Error: %s", testName,u_errorName(status));
659 }
660
661 status = U_ZERO_ERROR;
662 retVal = func(s1,-1,s2,-1,UIDNA_ALLOW_UNASSIGNED,&status);
663
664 if(isEqual==TRUE && retVal !=0){
665 errln("Did not get the expected result for %s with null termniated strings with options set.\n", testName);
666 }
667 if(U_FAILURE(status)){
668 errcheckln(status, "%s null terminated source and options set failed. Error: %s",testName, u_errorName(status));
669 }
670
671 status = U_ZERO_ERROR;
672 retVal = func(s1,s1Len,s2,s2Len,UIDNA_DEFAULT,&status);
673
674 if(isEqual==TRUE && retVal !=0){
675 errln("Did not get the expected result for %s with string length.\n",testName);
676 }
677 if(U_FAILURE(status)){
678 errcheckln(status, "%s with string length. Error: %s",testName, u_errorName(status));
679 }
680
681 status = U_ZERO_ERROR;
682 retVal = func(s1,s1Len,s2,s2Len,UIDNA_ALLOW_UNASSIGNED,&status);
683
684 if(isEqual==TRUE && retVal !=0){
685 errln("Did not get the expected result for %s with string length and options set.\n",testName);
686 }
687 if(U_FAILURE(status)){
688 errcheckln(status, "%s with string length and options set. Error: %s", u_errorName(status), testName);
689 }
690 }
691
testToASCII(const char * testName,TestFunc func)692 void TestIDNA::testToASCII(const char* testName, TestFunc func){
693
694 int32_t i;
695 UChar buf[MAX_DEST_SIZE];
696
697 for(i=0;i< (int32_t)(sizeof(unicodeIn)/sizeof(unicodeIn[0])); i++){
698 u_charsToUChars(asciiIn[i],buf, (int32_t)(strlen(asciiIn[i])+1));
699 testAPI(unicodeIn[i], buf,testName, FALSE,U_ZERO_ERROR, TRUE, TRUE, func);
700
701 }
702 }
703
testToUnicode(const char * testName,TestFunc func)704 void TestIDNA::testToUnicode(const char* testName, TestFunc func){
705
706 int32_t i;
707 UChar buf[MAX_DEST_SIZE];
708
709 for(i=0;i< (int32_t)(sizeof(asciiIn)/sizeof(asciiIn[0])); i++){
710 u_charsToUChars(asciiIn[i],buf, (int32_t)(strlen(asciiIn[i])+1));
711 testAPI(buf,unicodeIn[i],testName,FALSE,U_ZERO_ERROR, TRUE, TRUE, func);
712 }
713 }
714
715
testIDNToUnicode(const char * testName,TestFunc func)716 void TestIDNA::testIDNToUnicode(const char* testName, TestFunc func){
717 int32_t i;
718 UChar buf[MAX_DEST_SIZE];
719 UChar expected[MAX_DEST_SIZE];
720 UErrorCode status = U_ZERO_ERROR;
721 int32_t bufLen = 0;
722 UParseError parseError;
723 for(i=0;i< (int32_t)(sizeof(domainNames)/sizeof(domainNames[0])); i++){
724 bufLen = (int32_t)strlen(domainNames[i]);
725 bufLen = u_unescape(domainNames[i],buf, bufLen+1);
726 func(buf,bufLen,expected,MAX_DEST_SIZE, UIDNA_ALLOW_UNASSIGNED, &parseError,&status);
727 if(U_FAILURE(status)){
728 errcheckln(status, "%s failed to convert domainNames[%i].Error: %s",testName, i, u_errorName(status));
729 break;
730 }
731 testAPI(buf,expected,testName,FALSE,U_ZERO_ERROR, TRUE, TRUE, func);
732 //test toUnicode with all labels in the string
733 testAPI(buf,expected,testName, FALSE,U_ZERO_ERROR, TRUE, TRUE, func);
734 if(U_FAILURE(status)){
735 errln( "%s failed to convert domainNames[%i].Error: %s \n",testName,i, u_errorName(status));
736 break;
737 }
738 }
739
740 }
741
testIDNToASCII(const char * testName,TestFunc func)742 void TestIDNA::testIDNToASCII(const char* testName, TestFunc func){
743 int32_t i;
744 UChar buf[MAX_DEST_SIZE];
745 UChar expected[MAX_DEST_SIZE];
746 UErrorCode status = U_ZERO_ERROR;
747 int32_t bufLen = 0;
748 UParseError parseError;
749 for(i=0;i< (int32_t)(sizeof(domainNames)/sizeof(domainNames[0])); i++){
750 bufLen = (int32_t)strlen(domainNames[i]);
751 bufLen = u_unescape(domainNames[i],buf, bufLen+1);
752 func(buf,bufLen,expected,MAX_DEST_SIZE, UIDNA_ALLOW_UNASSIGNED, &parseError,&status);
753 if(U_FAILURE(status)){
754 errcheckln(status, "%s failed to convert domainNames[%i].Error: %s",testName,i, u_errorName(status));
755 break;
756 }
757 testAPI(buf,expected,testName, FALSE,U_ZERO_ERROR, TRUE, TRUE, func);
758 //test toASCII with all labels in the string
759 testAPI(buf,expected,testName, FALSE,U_ZERO_ERROR, FALSE, TRUE, func);
760 if(U_FAILURE(status)){
761 errln( "%s failed to convert domainNames[%i].Error: %s \n",testName,i, u_errorName(status));
762 break;
763 }
764 }
765
766 }
767
testCompare(const char * testName,CompareFunc func)768 void TestIDNA::testCompare(const char* testName, CompareFunc func){
769 int32_t i;
770
771
772 UChar www[] = {0x0057, 0x0057, 0x0057, 0x002E, 0x0000};
773 UChar com[] = {0x002E, 0x0043, 0x004F, 0x004D, 0x0000};
774 UChar buf[MAX_DEST_SIZE]={0x0057, 0x0057, 0x0057, 0x002E, 0x0000};
775
776 UnicodeString source(www), uni0(www),uni1(www), ascii0(www), ascii1(www);
777
778 uni0.append(unicodeIn[0]);
779 uni0.append(com);
780 uni0.append((UChar)0x0000);
781
782 uni1.append(unicodeIn[1]);
783 uni1.append(com);
784 uni1.append((UChar)0x0000);
785
786 ascii0.append(asciiIn[0]);
787 ascii0.append(com);
788 ascii0.append((UChar)0x0000);
789
790 ascii1.append(asciiIn[1]);
791 ascii1.append(com);
792 ascii1.append((UChar)0x0000);
793
794 for(i=0;i< (int32_t)(sizeof(unicodeIn)/sizeof(unicodeIn[0])); i++){
795
796 u_charsToUChars(asciiIn[i],buf+4, (int32_t)(strlen(asciiIn[i])+1));
797 u_strcat(buf,com);
798
799 // for every entry in unicodeIn array
800 // prepend www. and append .com
801 source.truncate(4);
802 source.append(unicodeIn[i]);
803 source.append(com);
804 source.append((UChar)0x0000);
805 // a) compare it with itself
806 const UChar* src = source.getBuffer();
807 int32_t srcLen = u_strlen(src); //subtract null
808
809 testCompare(src,srcLen,src,srcLen,testName, func, TRUE);
810
811 // b) compare it with asciiIn equivalent
812 testCompare(src,srcLen,buf,u_strlen(buf),testName, func,TRUE);
813
814 // c) compare it with unicodeIn not equivalent
815 if(i==0){
816 testCompare(src,srcLen,uni1.getBuffer(),uni1.length()-1,testName, func,FALSE);
817 }else{
818 testCompare(src,srcLen,uni0.getBuffer(),uni0.length()-1,testName, func,FALSE);
819 }
820 // d) compare it with asciiIn not equivalent
821 if(i==0){
822 testCompare(src,srcLen,ascii1.getBuffer(),ascii1.length()-1,testName, func,FALSE);
823 }else{
824 testCompare(src,srcLen,ascii0.getBuffer(),ascii0.length()-1,testName, func,FALSE);
825 }
826
827 }
828 }
829
830 #if 0
831
832 static int32_t
833 getNextSeperator(UChar *src,int32_t srcLength,
834 UChar **limit){
835 if(srcLength == -1){
836 int32_t i;
837 for(i=0 ; ;i++){
838 if(src[i] == 0){
839 *limit = src + i; // point to null
840 return i;
841 }
842 if(src[i]==0x002e){
843 *limit = src + (i+1); // go past the delimiter
844 return i;
845 }
846 }
847 // we have not found the delimiter
848 if(i==srcLength){
849 *limit = src+srcLength;
850 }
851 return i;
852 }else{
853 int32_t i;
854 for(i=0;i<srcLength;i++){
855 if(src[i]==0x002e){
856 *limit = src + (i+1); // go past the delimiter
857 return i;
858 }
859 }
860 // we have not found the delimiter
861 if(i==srcLength){
862 *limit = src+srcLength;
863 }
864 return i;
865 }
866 }
867
868 void printPunycodeOutput(){
869
870 UChar dest[MAX_DEST_SIZE];
871 int32_t destCapacity=MAX_DEST_SIZE;
872 UChar* start;
873 UChar* limit;
874 int32_t labelLen=0;
875 UBool caseFlags[MAX_DEST_SIZE];
876
877 for(int32_t i=0;i< sizeof(errorCases)/sizeof(errorCases[0]);i++){
878 ErrorCases errorCase = errorCases[i];
879 UErrorCode status = U_ZERO_ERROR;
880 start = errorCase.unicode;
881 int32_t srcLen = u_strlen(start);
882 labelLen = getNextSeperator(start,srcLen,&limit);
883 start = limit;
884 labelLen=getNextSeperator(start,srcLen-labelLen,&limit);
885 int32_t destLen = u_strToPunycode(dest,destCapacity,start,labelLen,caseFlags, &status);
886 if(U_FAILURE(status)){
887 printf("u_strToPunycode failed for index %i\n",i);
888 continue;
889 }
890 for(int32_t j=0; j<destLen; j++){
891 printf("%c",(char)dest[j]);
892 }
893 printf("\n");
894 }
895 }
896 #endif
897
testErrorCases(const char * IDNToASCIIName,TestFunc IDNToASCII,const char * IDNToUnicodeName,TestFunc IDNToUnicode)898 void TestIDNA::testErrorCases(const char* IDNToASCIIName, TestFunc IDNToASCII,
899 const char* IDNToUnicodeName, TestFunc IDNToUnicode){
900 UChar buf[MAX_DEST_SIZE];
901 int32_t bufLen=0;
902
903 for(int32_t i=0;i< (int32_t)(sizeof(errorCases)/sizeof(errorCases[0]));i++){
904 ErrorCases errorCase = errorCases[i];
905 UChar* src =NULL;
906 if(errorCase.ascii != NULL){
907 bufLen = (int32_t)strlen(errorCase.ascii);
908 u_charsToUChars(errorCase.ascii,buf, bufLen+1);
909 }else{
910 bufLen = 1 ;
911 memset(buf,0,U_SIZEOF_UCHAR*MAX_DEST_SIZE);
912 }
913
914 if(errorCase.unicode[0]!=0){
915 src = errorCase.unicode;
916 }
917 // test toASCII
918 testAPI(src,buf,
919 IDNToASCIIName, errorCase.useSTD3ASCIIRules,
920 errorCase.expected, TRUE, TRUE, IDNToASCII);
921 if(errorCase.testLabel ==TRUE){
922 testAPI(src,buf,
923 IDNToASCIIName, errorCase.useSTD3ASCIIRules,
924 errorCase.expected, FALSE,TRUE, IDNToASCII);
925 }
926 if(errorCase.testToUnicode ==TRUE){
927 testAPI((src==NULL)? NULL : buf,src,
928 IDNToUnicodeName, errorCase.useSTD3ASCIIRules,
929 errorCase.expected, TRUE, TRUE, IDNToUnicode);
930 }
931
932 }
933
934 }
935 /*
936 void TestIDNA::testConformance(const char* toASCIIName, TestFunc toASCII,
937 const char* IDNToASCIIName, TestFunc IDNToASCII,
938 const char* IDNToUnicodeName, TestFunc IDNToUnicode,
939 const char* toUnicodeName, TestFunc toUnicode){
940 UChar src[MAX_DEST_SIZE];
941 int32_t srcLen=0;
942 UChar expected[MAX_DEST_SIZE];
943 int32_t expectedLen = 0;
944 for(int32_t i=0;i< (int32_t)(sizeof(conformanceTestCases)/sizeof(conformanceTestCases[0]));i++){
945 const char* utf8Chars1 = conformanceTestCases[i].in;
946 int32_t utf8Chars1Len = (int32_t)strlen(utf8Chars1);
947 const char* utf8Chars2 = conformanceTestCases[i].out;
948 int32_t utf8Chars2Len = (utf8Chars2 == NULL) ? 0 : (int32_t)strlen(utf8Chars2);
949
950 UErrorCode status = U_ZERO_ERROR;
951 u_strFromUTF8(src,MAX_DEST_SIZE,&srcLen,utf8Chars1,utf8Chars1Len,&status);
952 if(U_FAILURE(status)){
953 errln(UnicodeString("Conversion of UTF8 source in conformanceTestCases[") + i +UnicodeString( "].in ( ")+prettify(utf8Chars1) +UnicodeString(" ) failed. Error: ")+ UnicodeString(u_errorName(status)));
954 continue;
955 }
956 if(utf8Chars2 != NULL){
957 u_strFromUTF8(expected,MAX_DEST_SIZE,&expectedLen,utf8Chars2,utf8Chars2Len, &status);
958 if(U_FAILURE(status)){
959 errln(UnicodeString("Conversion of UTF8 source in conformanceTestCases[") + i +UnicodeString( "].in ( ")+prettify(utf8Chars1) +UnicodeString(" ) failed. Error: ")+ UnicodeString(u_errorName(status)));
960 continue;
961 }
962 }
963
964 if(conformanceTestCases[i].expectedStatus != U_ZERO_ERROR){
965 // test toASCII
966 testAPI(src,expected,
967 IDNToASCIIName, FALSE,
968 conformanceTestCases[i].expectedStatus,
969 TRUE,
970 (conformanceTestCases[i].expectedStatus != U_IDNA_UNASSIGNED_ERROR),
971 IDNToASCII);
972
973 testAPI(src,expected,
974 toASCIIName, FALSE,
975 conformanceTestCases[i].expectedStatus, TRUE,
976 (conformanceTestCases[i].expectedStatus != U_IDNA_UNASSIGNED_ERROR),
977 toASCII);
978 }
979
980 testAPI(src,src,
981 IDNToUnicodeName, FALSE,
982 conformanceTestCases[i].expectedStatus, TRUE, TRUE, IDNToUnicode);
983 testAPI(src,src,
984 toUnicodeName, FALSE,
985 conformanceTestCases[i].expectedStatus, TRUE, TRUE, toUnicode);
986
987 }
988
989 }
990 */
991 // test and ascertain
992 // func(func(func(src))) == func(src)
testChaining(const UChar * src,int32_t numIterations,const char * testName,UBool useSTD3ASCIIRules,UBool caseInsensitive,TestFunc func)993 void TestIDNA::testChaining(const UChar* src,int32_t numIterations,const char* testName,
994 UBool useSTD3ASCIIRules, UBool caseInsensitive, TestFunc func){
995 UChar even[MAX_DEST_SIZE];
996 UChar odd[MAX_DEST_SIZE];
997 UChar expected[MAX_DEST_SIZE];
998 int32_t i=0,evenLen=0,oddLen=0,expectedLen=0;
999 UErrorCode status = U_ZERO_ERROR;
1000 int32_t srcLen = u_strlen(src);
1001 int32_t options = (useSTD3ASCIIRules == TRUE) ? UIDNA_USE_STD3_RULES : UIDNA_DEFAULT;
1002 UParseError parseError;
1003
1004 // test null-terminated source
1005 expectedLen = func(src,-1,expected,MAX_DEST_SIZE, options, &parseError, &status);
1006 if(U_FAILURE(status)){
1007 errcheckln(status, "%s null terminated source failed. Error: %s",testName, u_errorName(status));
1008 }
1009 memcpy(odd,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1010 memcpy(even,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1011 for(;i<=numIterations; i++){
1012 if((i%2) ==0){
1013 evenLen = func(odd,-1,even,MAX_DEST_SIZE,options, &parseError, &status);
1014 if(U_FAILURE(status)){
1015 errcheckln(status, "%s null terminated source failed - %s",testName, u_errorName(status));
1016 break;
1017 }
1018 }else{
1019 oddLen = func(even,-1,odd,MAX_DEST_SIZE,options, &parseError, &status);
1020 if(U_FAILURE(status)){
1021 errln("%s null terminated source failed\n",testName);
1022 break;
1023 }
1024 }
1025 }
1026 if(caseInsensitive ==TRUE){
1027 if( u_strCaseCompare(even,evenLen, expected,expectedLen, 0, &status) !=0 ||
1028 u_strCaseCompare(odd,oddLen, expected,expectedLen, 0, &status) !=0 ){
1029
1030 errln("Chaining for %s null terminated source failed\n",testName);
1031 }
1032 }else{
1033 if( u_strncmp(even,expected,expectedLen) != 0 ||
1034 u_strncmp(odd,expected,expectedLen) !=0 ){
1035
1036 errln("Chaining for %s null terminated source failed\n",testName);
1037 }
1038 }
1039
1040 // test null-terminated source
1041 status = U_ZERO_ERROR;
1042 expectedLen = func(src,-1,expected,MAX_DEST_SIZE,options|UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
1043 if(U_FAILURE(status)){
1044 errcheckln(status, "%s null terminated source with options set failed. Error: %s",testName, u_errorName(status));
1045 }
1046 memcpy(odd,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1047 memcpy(even,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1048 for(;i<=numIterations; i++){
1049 if((i%2) ==0){
1050 evenLen = func(odd,-1,even,MAX_DEST_SIZE,options|UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
1051 if(U_FAILURE(status)){
1052 errcheckln(status, "%s null terminated source with options set failed - %s",testName, u_errorName(status));
1053 break;
1054 }
1055 }else{
1056 oddLen = func(even,-1,odd,MAX_DEST_SIZE,options|UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
1057 if(U_FAILURE(status)){
1058 errln("%s null terminated source with options set failed\n",testName);
1059 break;
1060 }
1061 }
1062 }
1063 if(caseInsensitive ==TRUE){
1064 if( u_strCaseCompare(even,evenLen, expected,expectedLen, 0, &status) !=0 ||
1065 u_strCaseCompare(odd,oddLen, expected,expectedLen, 0, &status) !=0 ){
1066
1067 errln("Chaining for %s null terminated source with options set failed\n",testName);
1068 }
1069 }else{
1070 if( u_strncmp(even,expected,expectedLen) != 0 ||
1071 u_strncmp(odd,expected,expectedLen) !=0 ){
1072
1073 errln("Chaining for %s null terminated source with options set failed\n",testName);
1074 }
1075 }
1076
1077
1078 // test source with length
1079 status = U_ZERO_ERROR;
1080 expectedLen = func(src,srcLen,expected,MAX_DEST_SIZE,options, &parseError, &status);
1081 if(U_FAILURE(status)){
1082 errcheckln(status, "%s null terminated source failed. Error: %s",testName, u_errorName(status));
1083 }
1084 memcpy(odd,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1085 memcpy(even,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1086 for(;i<=numIterations; i++){
1087 if((i%2) ==0){
1088 evenLen = func(odd,oddLen,even,MAX_DEST_SIZE,options, &parseError, &status);
1089 if(U_FAILURE(status)){
1090 errcheckln(status, "%s source with source length failed - %s",testName, u_errorName(status));
1091 break;
1092 }
1093 }else{
1094 oddLen = func(even,evenLen,odd,MAX_DEST_SIZE,options, &parseError, &status);
1095 if(U_FAILURE(status)){
1096 errcheckln(status, "%s source with source length failed - %s",testName, u_errorName(status));
1097 break;
1098 }
1099 }
1100 }
1101 if(caseInsensitive ==TRUE){
1102 if( u_strCaseCompare(even,evenLen, expected,expectedLen, 0, &status) !=0 ||
1103 u_strCaseCompare(odd,oddLen, expected,expectedLen, 0, &status) !=0 ){
1104
1105 errln("Chaining for %s source with source length failed\n",testName);
1106 }
1107 }else{
1108 if( u_strncmp(even,expected,expectedLen) != 0 ||
1109 u_strncmp(odd,expected,expectedLen) !=0 ){
1110
1111 errln("Chaining for %s source with source length failed\n",testName);
1112 }
1113 }
1114 status = U_ZERO_ERROR;
1115 expectedLen = func(src,srcLen,expected,MAX_DEST_SIZE,options|UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
1116 if(U_FAILURE(status)){
1117 errcheckln(status, "%s null terminated source with options set failed. Error: %s",testName, u_errorName(status));
1118 }
1119 memcpy(odd,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1120 memcpy(even,expected,(expectedLen+1) * U_SIZEOF_UCHAR);
1121 for(;i<=numIterations; i++){
1122 if((i%2) ==0){
1123 evenLen = func(odd,oddLen,even,MAX_DEST_SIZE,options|UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
1124 if(U_FAILURE(status)){
1125 errcheckln(status, "%s source with source length and options set failed - %s",testName, u_errorName(status));
1126 break;
1127 }
1128 }else{
1129 oddLen = func(even,evenLen,odd,MAX_DEST_SIZE,options|UIDNA_ALLOW_UNASSIGNED, &parseError, &status);
1130 if(U_FAILURE(status)){
1131 errcheckln(status, "%s source with source length and options set failed - %s",testName, u_errorName(status));
1132 break;
1133 }
1134 }
1135 }
1136 if(caseInsensitive ==TRUE){
1137 if( u_strCaseCompare(even,evenLen, expected,expectedLen, 0, &status) !=0 ||
1138 u_strCaseCompare(odd,oddLen, expected,expectedLen, 0, &status) !=0 ){
1139
1140 errln("Chaining for %s source with source length and options set failed\n",testName);
1141 }
1142 }else{
1143 if( u_strncmp(even,expected,expectedLen) != 0 ||
1144 u_strncmp(odd,expected,expectedLen) !=0 ){
1145
1146 errln("Chaining for %s source with source length and options set failed\n",testName);
1147 }
1148 }
1149 }
testChaining(const char * toASCIIName,TestFunc toASCII,const char * toUnicodeName,TestFunc toUnicode)1150 void TestIDNA::testChaining(const char* toASCIIName, TestFunc toASCII,
1151 const char* toUnicodeName, TestFunc toUnicode){
1152 int32_t i;
1153 UChar buf[MAX_DEST_SIZE];
1154
1155 for(i=0;i< (int32_t)(sizeof(asciiIn)/sizeof(asciiIn[0])); i++){
1156 u_charsToUChars(asciiIn[i],buf, (int32_t)(strlen(asciiIn[i])+1));
1157 testChaining(buf,5,toUnicodeName, FALSE, FALSE, toUnicode);
1158 }
1159 for(i=0;i< (int32_t)(sizeof(unicodeIn)/sizeof(unicodeIn[0])); i++){
1160 testChaining(unicodeIn[i], 5,toASCIIName, FALSE, TRUE, toASCII);
1161 }
1162 }
1163
1164
testRootLabelSeparator(const char * testName,CompareFunc func,const char * IDNToASCIIName,TestFunc IDNToASCII,const char * IDNToUnicodeName,TestFunc IDNToUnicode)1165 void TestIDNA::testRootLabelSeparator(const char* testName, CompareFunc func,
1166 const char* IDNToASCIIName, TestFunc IDNToASCII,
1167 const char* IDNToUnicodeName, TestFunc IDNToUnicode){
1168 int32_t i;
1169
1170
1171 UChar www[] = {0x0057, 0x0057, 0x0057, 0x002E, 0x0000};
1172 UChar com[] = {0x002E, 0x0043, 0x004F, 0x004D, 0x002E, /* root label separator */0x0000};
1173 UChar buf[MAX_DEST_SIZE]={0x0057, 0x0057, 0x0057, 0x002E, 0x0000};
1174
1175 UnicodeString source(www), uni0(www),uni1(www), ascii0(www), ascii1(www);
1176
1177 uni0.append(unicodeIn[0]);
1178 uni0.append(com);
1179 uni0.append((UChar)0x0000);
1180
1181 uni1.append(unicodeIn[1]);
1182 uni1.append(com);
1183 uni1.append((UChar)0x0000);
1184
1185 ascii0.append(asciiIn[0]);
1186 ascii0.append(com);
1187 ascii0.append((UChar)0x0000);
1188
1189 ascii1.append(asciiIn[1]);
1190 ascii1.append(com);
1191 ascii1.append((UChar)0x0000);
1192
1193 for(i=0;i< (int32_t)(sizeof(unicodeIn)/sizeof(unicodeIn[0])); i++){
1194
1195 u_charsToUChars(asciiIn[i],buf+4, (int32_t)(strlen(asciiIn[i])+1));
1196 u_strcat(buf,com);
1197
1198 // for every entry in unicodeIn array
1199 // prepend www. and append .com
1200 source.truncate(4);
1201 source.append(unicodeIn[i]);
1202 source.append(com);
1203 source.append((UChar)0x0000);
1204
1205 const UChar* src = source.getBuffer();
1206 int32_t srcLen = u_strlen(src); //subtract null
1207
1208 // b) compare it with asciiIn equivalent
1209 testCompare(src,srcLen,buf,u_strlen(buf),testName, func,TRUE);
1210
1211 // a) compare it with itself
1212 testCompare(src,srcLen,src,srcLen,testName, func,TRUE);
1213
1214
1215 // IDNToASCII comparison
1216 testAPI(src,buf,IDNToASCIIName,FALSE,U_ZERO_ERROR,TRUE, TRUE, IDNToASCII);
1217 // IDNToUnicode comparison
1218 testAPI(buf,src,IDNToUnicodeName, FALSE,U_ZERO_ERROR, TRUE, TRUE, IDNToUnicode);
1219
1220 // c) compare it with unicodeIn not equivalent
1221 if(i==0){
1222 testCompare(src,srcLen,uni1.getBuffer(),uni1.length()-1,testName, func,FALSE);
1223 }else{
1224 testCompare(src,srcLen,uni0.getBuffer(),uni0.length()-1,testName, func,FALSE);
1225 }
1226 // d) compare it with asciiIn not equivalent
1227 if(i==0){
1228 testCompare(src,srcLen,ascii1.getBuffer(),ascii1.length()-1,testName, func,FALSE);
1229 }else{
1230 testCompare(src,srcLen,ascii0.getBuffer(),ascii0.length()-1,testName, func,FALSE);
1231 }
1232 }
1233 }
1234
1235 //---------------------------------------------
1236 // runIndexedTest
1237 //---------------------------------------------
1238
1239 extern IntlTest *createUTS46Test();
1240
runIndexedTest(int32_t index,UBool exec,const char * & name,char * par)1241 void TestIDNA::runIndexedTest( int32_t index, UBool exec, const char* &name, char* par)
1242 {
1243 if (exec) logln((UnicodeString)"TestSuite IDNA API ");
1244 switch (index) {
1245
1246 case 0: name = "TestToASCII"; if (exec) TestToASCII(); break;
1247 case 1: name = "TestToUnicode"; if (exec) TestToUnicode(); break;
1248 case 2: name = "TestIDNToASCII"; if (exec) TestIDNToASCII(); break;
1249 case 3: name = "TestIDNToUnicode"; if (exec) TestIDNToUnicode(); break;
1250 case 4: name = "TestCompare"; if (exec) TestCompare(); break;
1251 case 5: name = "TestErrorCases"; if (exec) TestErrorCases(); break;
1252 case 6: name = "TestChaining"; if (exec) TestChaining(); break;
1253 case 7: name = "TestRootLabelSeparator"; if(exec) TestRootLabelSeparator(); break;
1254 case 8: name = "TestCompareReferenceImpl"; if(exec) TestCompareReferenceImpl(); break;
1255 case 9: name = "TestDataFile"; if(exec) TestDataFile(); break;
1256 #if !UCONFIG_NO_FILE_IO && !UCONFIG_NO_LEGACY_CONVERSION
1257 case 10: name = "TestRefIDNA"; if(exec) TestRefIDNA(); break;
1258 case 11: name = "TestIDNAMonkeyTest"; if(exec) TestIDNAMonkeyTest(); break;
1259 #else
1260 case 10: case 11: name = "skip"; break;
1261 #endif
1262 case 12:
1263 {
1264 name = "TestConformanceTestVectors";
1265 if(exec){
1266 logln("TestSuite IDNA conf----"); logln();
1267 IdnaConfTest test;
1268 callTest(test, par);
1269 }
1270 break;
1271 }
1272 case 13:
1273 name = "UTS46Test";
1274 if (exec) {
1275 logln("TestSuite UTS46Test---"); logln();
1276 LocalPointer<IntlTest> test(createUTS46Test());
1277 callTest(*test, par);
1278 }
1279 break;
1280 default: name = ""; break; /*needed to end loop*/
1281 }
1282 }
TestToASCII()1283 void TestIDNA::TestToASCII(){
1284 testToASCII("uidna_toASCII", uidna_toASCII);
1285 }
TestToUnicode()1286 void TestIDNA::TestToUnicode(){
1287 testToUnicode("uidna_toUnicode", uidna_toUnicode);
1288 }
TestIDNToASCII()1289 void TestIDNA::TestIDNToASCII(){
1290 testIDNToASCII("uidna_IDNToASCII", uidna_IDNToASCII);
1291 }
TestIDNToUnicode()1292 void TestIDNA::TestIDNToUnicode(){
1293 testIDNToUnicode("uidna_IDNToUnicode", uidna_IDNToUnicode);
1294 }
TestCompare()1295 void TestIDNA::TestCompare(){
1296 testCompare("uidna_compare",uidna_compare);
1297 }
TestErrorCases()1298 void TestIDNA::TestErrorCases(){
1299 testErrorCases( "uidna_IDNToASCII",uidna_IDNToASCII,
1300 "uidna_IDNToUnicode",uidna_IDNToUnicode);
1301 }
TestRootLabelSeparator()1302 void TestIDNA::TestRootLabelSeparator(){
1303 testRootLabelSeparator( "uidna_compare",uidna_compare,
1304 "uidna_IDNToASCII", uidna_IDNToASCII,
1305 "uidna_IDNToUnicode",uidna_IDNToUnicode
1306 );
1307 }
TestChaining()1308 void TestIDNA::TestChaining(){
1309 testChaining("uidna_toASCII",uidna_toASCII, "uidna_toUnicode", uidna_toUnicode);
1310 }
1311
1312
// Number of random inputs generated by TestIDNAMonkeyTest().
static const int loopCount = 100;
// Bound handed to randi() when getTestSource() picks how many code points to
// append; the resulting count is randi(maxCharCount) + 1.
static const int maxCharCount = 20;
// Highest Unicode code point. NOTE(review): no use of this constant is visible
// in this part of the file -- confirm whether it is still needed.
static const int maxCodePoint = 0x10ffff;
1316 static uint32_t
randul()1317 randul()
1318 {
1319 static UBool initialized = FALSE;
1320 if (!initialized)
1321 {
1322 srand((unsigned)time(NULL));
1323 initialized = TRUE;
1324 }
1325 // Assume rand has at least 12 bits of precision
1326 uint32_t l = 0;
1327 for (uint32_t i=0; i<sizeof(l); ++i)
1328 ((char*)&l)[i] = (char)((rand() & 0x0FF0) >> 4);
1329 return l;
1330 }
1331
1332 /**
1333 * Return a random integer i where 0 <= i < n.
1334 * A special function that gets random codepoints from planes 0,1,2 and 14
1335 */
rand_uni()1336 static int32_t rand_uni()
1337 {
1338 int32_t retVal = (int32_t)(randul()& 0x3FFFF);
1339 if(retVal >= 0x30000){
1340 retVal+=0xB0000;
1341 }
1342 return retVal;
1343 }
1344
randi(int32_t n)1345 static int32_t randi(int32_t n){
1346 return (int32_t) (randul() % (n+1));
1347 }
1348
getTestSource(UnicodeString & fillIn)1349 void getTestSource(UnicodeString& fillIn) {
1350 int32_t i = 0;
1351 int32_t charCount = (randi(maxCharCount) + 1);
1352 while (i <charCount ) {
1353 int32_t codepoint = rand_uni();
1354 if(codepoint == 0x0000){
1355 continue;
1356 }
1357 fillIn.append((UChar32)codepoint);
1358 i++;
1359 }
1360
1361 }
1362
testCompareReferenceImpl(UnicodeString & src,TestFunc refIDNA,const char * refIDNAName,TestFunc uIDNA,const char * uIDNAName,int32_t options)1363 UnicodeString TestIDNA::testCompareReferenceImpl(UnicodeString& src,
1364 TestFunc refIDNA, const char* refIDNAName,
1365 TestFunc uIDNA, const char* uIDNAName,
1366 int32_t options){
1367
1368 const UChar* srcUChars = src.getBuffer();
1369 UChar exp[MAX_DEST_SIZE]={0};
1370 int32_t expCap = MAX_DEST_SIZE, expLen=0;
1371 UErrorCode expStatus = U_ZERO_ERROR;
1372 UParseError parseError;
1373
1374 logln("Comparing "+ UnicodeString(refIDNAName)
1375 + " with "+ UnicodeString(uIDNAName)
1376 +" for input: " + prettify(srcUChars));
1377
1378 expLen = refIDNA(srcUChars, src.length()-1, exp, expCap,
1379 options, &parseError, &expStatus);
1380
1381 UChar got[MAX_DEST_SIZE]={0};
1382 int32_t gotCap = MAX_DEST_SIZE, gotLen=0;
1383 UErrorCode gotStatus = U_ZERO_ERROR;
1384
1385 gotLen = uIDNA(srcUChars, src.length()-1, got, gotCap,
1386 options, &parseError, &gotStatus);
1387
1388 if(expStatus != gotStatus){
1389 errln("Did not get the expected status while comparing " + UnicodeString(refIDNAName)
1390 + " with " + UnicodeString(uIDNAName)
1391 + " Expected: " + UnicodeString(u_errorName(expStatus))
1392 + " Got: " + UnicodeString(u_errorName(gotStatus))
1393 + " for Source: "+ prettify(srcUChars)
1394 + " Options: " + options);
1395 return UnicodeString("");
1396 }
1397
1398 // now we know that both implementations yielded same error
1399 if(U_SUCCESS(expStatus)){
1400 // compare the outputs if status == U_ZERO_ERROR
1401 if(u_strCompare(exp, expLen, got, gotLen, TRUE) != 0){
1402 errln("Did not get the expected output while comparing " + UnicodeString(refIDNAName)
1403 + " with " + UnicodeString(uIDNAName)
1404 + " Expected: " + prettify(UnicodeString(exp, expLen))
1405 + " Got: " + prettify(UnicodeString(got, gotLen))
1406 + " for Source: "+ prettify(srcUChars)
1407 + " Options: " + options);
1408 }
1409 return UnicodeString(exp, expLen);
1410
1411 }else{
1412 logln("Got the same error while comparing "
1413 + UnicodeString(refIDNAName)
1414 + " with "+ UnicodeString(uIDNAName)
1415 +" for input: " + prettify(srcUChars));
1416 }
1417 return UnicodeString("");
1418 }
1419
testCompareReferenceImpl(const UChar * src,int32_t srcLen)1420 void TestIDNA::testCompareReferenceImpl(const UChar* src, int32_t srcLen){
1421 UnicodeString label(src,srcLen);
1422 label.append((UChar)0x0000);
1423
1424 //test idnaref_toASCII and idnare
1425 UnicodeString asciiLabel = testCompareReferenceImpl(label,
1426 idnaref_toASCII, "idnaref_toASCII",
1427 uidna_toASCII, "uidna_toASCII",
1428 UIDNA_ALLOW_UNASSIGNED);
1429 testCompareReferenceImpl(label,
1430 idnaref_toASCII, "idnaref_toASCII",
1431 uidna_toASCII, "uidna_toASCII",
1432 UIDNA_DEFAULT);
1433 testCompareReferenceImpl(label,
1434 idnaref_toASCII, "idnaref_toASCII",
1435 uidna_toASCII, "uidna_toASCII",
1436 UIDNA_USE_STD3_RULES);
1437 testCompareReferenceImpl(label,
1438 idnaref_toASCII, "idnaref_toASCII",
1439 uidna_toASCII, "uidna_toASCII",
1440 UIDNA_USE_STD3_RULES | UIDNA_ALLOW_UNASSIGNED);
1441
1442 if(asciiLabel.length()!=0){
1443 asciiLabel.append((UChar)0x0000);
1444
1445 // test toUnciode
1446 testCompareReferenceImpl(asciiLabel,
1447 idnaref_toUnicode, "idnaref_toUnicode",
1448 uidna_toUnicode, "uidna_toUnicode",
1449 UIDNA_ALLOW_UNASSIGNED);
1450 testCompareReferenceImpl(asciiLabel,
1451 idnaref_toUnicode, "idnaref_toUnicode",
1452 uidna_toUnicode, "uidna_toUnicode",
1453 UIDNA_DEFAULT);
1454 testCompareReferenceImpl(asciiLabel,
1455 idnaref_toUnicode, "idnaref_toUnicode",
1456 uidna_toUnicode, "uidna_toUnicode",
1457 UIDNA_USE_STD3_RULES);
1458 testCompareReferenceImpl(asciiLabel,
1459 idnaref_toUnicode, "idnaref_toUnicode",
1460 uidna_toUnicode, "uidna_toUnicode",
1461 UIDNA_USE_STD3_RULES | UIDNA_ALLOW_UNASSIGNED);
1462 }
1463
1464 }
// Escaped inputs that TestIDNAMonkeyTest() unescapes and re-runs through
// testCompareReferenceImpl() on every run ("for debugging", per that test).
const char* failures[] ={
    "\\uAA42\\U0001F8DD\\U00019D01\\U000149A3\\uD385\\U000EE0F5\\U00018B92\\U000179D1\\U00018624\\U0002227F\\U000E83C0\\U000E8DCD\\u5460\\U00017F34\\U0001570B\\u43D1\\U0002C9C9\\U000281EC\\u2105\\U000180AE\\uC5D4",
    "\\U0002F5A6\\uD638\\u0D0A\\u9E9C\\uFE5B\\U0001FCCB\\u66C4",
};
1469
TestIDNAMonkeyTest()1470 void TestIDNA::TestIDNAMonkeyTest(){
1471 UnicodeString source;
1472 UErrorCode status = U_ZERO_ERROR;
1473 int i;
1474
1475 getInstance(status); // Init prep
1476 if (U_FAILURE(status)) {
1477 dataerrln("Test could not initialize. Got %s", u_errorName(status));
1478 return;
1479 }
1480
1481 for(i=0; i<loopCount; i++){
1482 source.truncate(0);
1483 getTestSource(source);
1484 source.append((UChar)0x0000);
1485 const UChar* src = source.getBuffer();
1486 testCompareReferenceImpl(src,source.length()-1);
1487 testCompareReferenceImpl(src,source.length()-1);
1488 }
1489
1490 /* for debugging */
1491 for (i=0; i<(int)(sizeof(failures)/sizeof(failures[0])); i++){
1492 source.truncate(0);
1493 source.append( UnicodeString(failures[i], -1, US_INV) );
1494 source = source.unescape();
1495 source.append((UChar)0x0000);
1496 const UChar *src = source.getBuffer();
1497 testCompareReferenceImpl(src,source.length()-1);
1498 //debug(source.getBuffer(),source.length(),UIDNA_ALLOW_UNASSIGNED);
1499 }
1500
1501
1502 source.truncate(0);
1503 source.append(UNICODE_STRING_SIMPLE("\\uCF18\\U00021161\\U000EEF11\\U0002BB82\\U0001D63C"));
1504 debug(source.getBuffer(),source.length(),UIDNA_ALLOW_UNASSIGNED);
1505
1506 { // test deletion of code points
1507 UnicodeString source("\\u043f\\u00AD\\u034f\\u043e\\u0447\\u0435\\u043c\\u0443\\u0436\\u0435\\u043e\\u043d\\u0438\\u043d\\u0435\\u0433\\u043e\\u0432\\u043e\\u0440\\u044f\\u0442\\u043f\\u043e\\u0440\\u0443\\u0441\\u0441\\u043a\\u0438\\u0000", -1, US_INV);
1508 source = source.unescape();
1509 UnicodeString expected("\\u043f\\u043e\\u0447\\u0435\\u043c\\u0443\\u0436\\u0435\\u043e\\u043d\\u0438\\u043d\\u0435\\u0433\\u043e\\u0432\\u043e\\u0440\\u044f\\u0442\\u043f\\u043e\\u0440\\u0443\\u0441\\u0441\\u043a\\u0438\\u0000", -1, US_INV);
1510 expected = expected.unescape();
1511 UnicodeString ascii("xn--b1abfaaepdrnnbgefbadotcwatmq2g4l");
1512 ascii.append((UChar)0x0000);
1513 testAPI(source.getBuffer(),ascii.getBuffer(), "uidna_toASCII", FALSE, U_ZERO_ERROR, TRUE, TRUE, uidna_toASCII);
1514
1515 testAPI(source.getBuffer(),ascii.getBuffer(), "idnaref_toASCII", FALSE, U_ZERO_ERROR, TRUE, TRUE, idnaref_toASCII);
1516
1517 testCompareReferenceImpl(source.getBuffer(), source.length()-1);
1518 }
1519
1520 }
1521
TestCompareReferenceImpl()1522 void TestIDNA::TestCompareReferenceImpl(){
1523
1524 UChar src [2] = {0,0};
1525 int32_t srcLen = 0;
1526
1527 // data even OK?
1528 {
1529 UErrorCode dataStatus = U_ZERO_ERROR;
1530 loadTestData(dataStatus);
1531 if(U_FAILURE(dataStatus)) {
1532 dataerrln("Couldn't load test data: %s\n", u_errorName(dataStatus)); // save us from thousands and thousands of errors
1533 return;
1534 }
1535 }
1536
1537 for (int32_t i = 0; i <= 0x10FFFF; i++){
1538 if (quick == TRUE && i > 0x0FFF){
1539 return;
1540 }
1541 if(i == 0x30000){
1542 // jump to E0000, no characters assigned in plain 3 to plain 13 as of Unicode 6.0
1543 i = 0xE0000;
1544 }
1545 if (i > 0xFFFF){
1546 src[0] = U16_LEAD(i);
1547 src[1] = U16_TRAIL(i);
1548 srcLen =2;
1549 } else {
1550 src[0] = (UChar)i;
1551 src[1] = 0;
1552 srcLen = 1;
1553 }
1554 testCompareReferenceImpl(src, srcLen);
1555 }
1556 }
1557
TestRefIDNA()1558 void TestIDNA::TestRefIDNA(){
1559 UErrorCode status = U_ZERO_ERROR;
1560 getInstance(status); // Init prep
1561 if (U_FAILURE(status)) {
1562 if (status == U_FILE_ACCESS_ERROR) {
1563 dataerrln("Test could not initialize. Got %s", u_errorName(status));
1564 }
1565 return;
1566 }
1567
1568 testToASCII("idnaref_toASCII", idnaref_toASCII);
1569 testToUnicode("idnaref_toUnicode", idnaref_toUnicode);
1570 testIDNToASCII("idnaref_IDNToASCII", idnaref_IDNToASCII);
1571 testIDNToUnicode("idnaref_IDNToUnicode", idnaref_IDNToUnicode);
1572 testCompare("idnaref_compare",idnaref_compare);
1573 testErrorCases( "idnaref_IDNToASCII",idnaref_IDNToASCII,
1574 "idnaref_IDNToUnicode",idnaref_IDNToUnicode);
1575 testChaining("idnaref_toASCII",idnaref_toASCII, "idnaref_toUnicode", idnaref_toUnicode);
1576
1577 testRootLabelSeparator( "idnaref_compare",idnaref_compare,
1578 "idnaref_IDNToASCII", idnaref_IDNToASCII,
1579 "idnaref_IDNToUnicode",idnaref_IDNToUnicode
1580 );
1581 testChaining("idnaref_toASCII",idnaref_toASCII, "idnaref_toUnicode", idnaref_toUnicode);
1582 }
1583
1584
TestDataFile()1585 void TestIDNA::TestDataFile(){
1586 testData(*this);
1587 }
~TestIDNA()1588 TestIDNA::~TestIDNA(){
1589 if(gPrep!=NULL){
1590 delete gPrep;
1591 gPrep = NULL;
1592 }
1593 }
1594
// Shared NamePrepTransform: created on first use by getInstance() and
// deleted by ~TestIDNA().
NamePrepTransform* TestIDNA::gPrep = NULL;
1596
getInstance(UErrorCode & status)1597 NamePrepTransform* TestIDNA::getInstance(UErrorCode& status){
1598 if(TestIDNA::gPrep == NULL){
1599 UParseError parseError;
1600 TestIDNA::gPrep = NamePrepTransform::createInstance(parseError, status);
1601 if(TestIDNA::gPrep ==NULL){
1602 //status = U_MEMORY_ALLOCATION_ERROR;
1603 return NULL;
1604 }
1605 }
1606 return TestIDNA::gPrep;
1607
1608 }
#endif /* #if !UCONFIG_NO_IDNA && !UCONFIG_NO_TRANSLITERATION */
1610