OLD | NEW |
| (Empty) |
1 /* | |
2 ****************************************************************************** | |
3 * | |
4 * Copyright (C) 2001-2011, International Business Machines | |
5 * Corporation and others. All Rights Reserved. | |
6 * | |
7 ****************************************************************************** | |
8 * file name: trietest.c | |
9 * encoding: US-ASCII | |
10 * tab size: 8 (not used) | |
11 * indentation:4 | |
12 * | |
13 * created on: 2001nov20 | |
14 * created by: Markus W. Scherer | |
15 */ | |
16 | |
17 #include <stdio.h> | |
18 #include "unicode/utypes.h" | |
19 #include "unicode/utf16.h" | |
20 #include "utrie.h" | |
21 #include "cstring.h" | |
22 #include "cmemory.h" | |
23 | |
24 #if 1 | |
25 #include "cintltst.h" | |
26 #else | |
27 /* definitions from standalone utrie development */ | |
28 #define log_err printf | |
29 #define log_verbose printf | |
30 | |
31 #undef u_errorName | |
32 #define u_errorName(errorCode) "some error code" | |
33 #endif | |
34 | |
35 #define ARRAY_LENGTH(array) (sizeof(array)/sizeof(array[0])) | |
36 | |
37 /* Values for setting possibly overlapping, out-of-order ranges of values */ | |
38 typedef struct SetRange { | |
39 UChar32 start, limit; | |
40 uint32_t value; | |
41 UBool overwrite; | |
42 } SetRange; | |
43 | |
44 /* | |
45 * Values for testing: | |
46 * value is set from the previous boundary's limit to before | |
47 * this boundary's limit | |
48 */ | |
49 typedef struct CheckRange { | |
50 UChar32 limit; | |
51 uint32_t value; | |
52 } CheckRange; | |
53 | |
54 | |
55 static uint32_t U_CALLCONV | |
56 _testFoldedValue32(UNewTrie *trie, UChar32 start, int32_t offset) { | |
57 uint32_t foldedValue, value; | |
58 UChar32 limit; | |
59 UBool inBlockZero; | |
60 | |
61 foldedValue=0; | |
62 | |
63 limit=start+0x400; | |
64 while(start<limit) { | |
65 value=utrie_get32(trie, start, &inBlockZero); | |
66 if(inBlockZero) { | |
67 start+=UTRIE_DATA_BLOCK_LENGTH; | |
68 } else { | |
69 foldedValue|=value; | |
70 ++start; | |
71 } | |
72 } | |
73 | |
74 if(foldedValue!=0) { | |
75 return ((uint32_t)offset<<16)|foldedValue; | |
76 } else { | |
77 return 0; | |
78 } | |
79 } | |
80 | |
81 static int32_t U_CALLCONV | |
82 _testFoldingOffset32(uint32_t data) { | |
83 return (int32_t)(data>>16); | |
84 } | |
85 | |
86 static uint32_t U_CALLCONV | |
87 _testFoldedValue16(UNewTrie *trie, UChar32 start, int32_t offset) { | |
88 uint32_t foldedValue, value; | |
89 UChar32 limit; | |
90 UBool inBlockZero; | |
91 | |
92 foldedValue=0; | |
93 | |
94 limit=start+0x400; | |
95 while(start<limit) { | |
96 value=utrie_get32(trie, start, &inBlockZero); | |
97 if(inBlockZero) { | |
98 start+=UTRIE_DATA_BLOCK_LENGTH; | |
99 } else { | |
100 foldedValue|=value; | |
101 ++start; | |
102 } | |
103 } | |
104 | |
105 if(foldedValue!=0) { | |
106 return (uint32_t)(offset|0x8000); | |
107 } else { | |
108 return 0; | |
109 } | |
110 } | |
111 | |
112 static int32_t U_CALLCONV | |
113 _testFoldingOffset16(uint32_t data) { | |
114 if(data&0x8000) { | |
115 return (int32_t)(data&0x7fff); | |
116 } else { | |
117 return 0; | |
118 } | |
119 } | |
120 | |
121 static uint32_t U_CALLCONV | |
122 _testEnumValue(const void *context, uint32_t value) { | |
123 return value^0x5555; | |
124 } | |
125 | |
126 static UBool U_CALLCONV | |
127 _testEnumRange(const void *context, UChar32 start, UChar32 limit, uint32_t value
) { | |
128 const CheckRange **pb=(const CheckRange **)context; | |
129 const CheckRange *b=(*pb)++; | |
130 | |
131 value^=0x5555; | |
132 if(start!=(b-1)->limit || limit!=b->limit || value!=b->value) { | |
133 log_err("error: utrie_enum() delivers wrong range [U+%04lx..U+%04lx[.0x%
lx instead of [U+%04lx..U+%04lx[.0x%lx\n", | |
134 start, limit, value, | |
135 (b-1)->limit, b->limit, b->value); | |
136 } | |
137 return TRUE; | |
138 } | |
139 | |
140 static void | |
141 testTrieIteration(const char *testName, | |
142 const UTrie *trie, | |
143 const CheckRange checkRanges[], int32_t countCheckRanges) { | |
144 UChar s[100]; | |
145 uint32_t values[30]; | |
146 | |
147 const UChar *p, *limit; | |
148 | |
149 uint32_t value; | |
150 UChar32 c; | |
151 int32_t i, length, countValues; | |
152 UChar c2; | |
153 | |
154 /* write a string */ | |
155 length=countValues=0; | |
156 for(i=0; i<countCheckRanges; ++i) { | |
157 c=checkRanges[i].limit; | |
158 if(c!=0) { | |
159 --c; | |
160 U16_APPEND_UNSAFE(s, length, c); | |
161 values[countValues++]=checkRanges[i].value; | |
162 } | |
163 } | |
164 limit=s+length; | |
165 | |
166 /* try forward */ | |
167 p=s; | |
168 i=0; | |
169 while(p<limit) { | |
170 c=c2=0x33; | |
171 if(trie->data32!=NULL) { | |
172 UTRIE_NEXT32(trie, p, limit, c, c2, value); | |
173 } else { | |
174 UTRIE_NEXT16(trie, p, limit, c, c2, value); | |
175 } | |
176 if(value!=values[i]) { | |
177 log_err("error: wrong value from UTRIE_NEXT(%s)(U+%04lx, U+%04lx): 0
x%lx instead of 0x%lx\n", | |
178 testName, c, c2, value, values[i]); | |
179 } | |
180 if( | |
181 c2==0 ? | |
182 c!=*(p-1) : | |
183 !U16_IS_LEAD(c) || !U16_IS_TRAIL(c2) || c!=*(p-2) || c2!=*(p-1) | |
184 ) { | |
185 log_err("error: wrong (c, c2) from UTRIE_NEXT(%s): (U+%04lx, U+%04lx
)\n", | |
186 testName, c, c2); | |
187 continue; | |
188 } | |
189 if(c2!=0) { | |
190 int32_t offset; | |
191 | |
192 if(trie->data32==NULL) { | |
193 value=UTRIE_GET16_FROM_LEAD(trie, c); | |
194 offset=trie->getFoldingOffset(value); | |
195 if(offset>0) { | |
196 value=UTRIE_GET16_FROM_OFFSET_TRAIL(trie, offset, c2); | |
197 } else { | |
198 value=trie->initialValue; | |
199 } | |
200 } else { | |
201 value=UTRIE_GET32_FROM_LEAD(trie, c); | |
202 offset=trie->getFoldingOffset(value); | |
203 if(offset>0) { | |
204 value=UTRIE_GET32_FROM_OFFSET_TRAIL(trie, offset, c2); | |
205 } else { | |
206 value=trie->initialValue; | |
207 } | |
208 } | |
209 if(value!=values[i]) { | |
210 log_err("error: wrong value from UTRIE_GETXX_FROM_OFFSET_TRAIL(%
s)(U+%04lx, U+%04lx): 0x%lx instead of 0x%lx\n", | |
211 testName, c, c2, value, values[i]); | |
212 } | |
213 } | |
214 if(c2!=0) { | |
215 value=0x44; | |
216 if(trie->data32==NULL) { | |
217 UTRIE_GET16_FROM_PAIR(trie, c, c2, value); | |
218 } else { | |
219 UTRIE_GET32_FROM_PAIR(trie, c, c2, value); | |
220 } | |
221 if(value!=values[i]) { | |
222 log_err("error: wrong value from UTRIE_GETXX_FROM_PAIR(%s)(U+%04
lx, U+%04lx): 0x%lx instead of 0x%lx\n", | |
223 testName, c, c2, value, values[i]); | |
224 } | |
225 } | |
226 ++i; | |
227 } | |
228 | |
229 /* try backward */ | |
230 p=limit; | |
231 i=countValues; | |
232 while(s<p) { | |
233 --i; | |
234 c=c2=0x33; | |
235 if(trie->data32!=NULL) { | |
236 UTRIE_PREVIOUS32(trie, s, p, c, c2, value); | |
237 } else { | |
238 UTRIE_PREVIOUS16(trie, s, p, c, c2, value); | |
239 } | |
240 if(value!=values[i]) { | |
241 log_err("error: wrong value from UTRIE_PREVIOUS(%s)(U+%04lx, U+%04lx
): 0x%lx instead of 0x%lx\n", | |
242 testName, c, c2, value, values[i]); | |
243 } | |
244 if( | |
245 c2==0 ? | |
246 c!=*p: | |
247 !U16_IS_LEAD(c) || !U16_IS_TRAIL(c2) || c!=*p || c2!=*(p+1) | |
248 ) { | |
249 log_err("error: wrong (c, c2) from UTRIE_PREVIOUS(%s): (U+%04lx, U+%
04lx)\n", | |
250 testName, c, c2); | |
251 } | |
252 } | |
253 } | |
254 | |
255 static void | |
256 testTrieRangesWithMalloc(const char *testName, | |
257 const SetRange setRanges[], int32_t countSetRanges, | |
258 const CheckRange checkRanges[], int32_t countCheckRanges, | |
259 UBool dataIs32, UBool latin1Linear) { | |
260 UTrieGetFoldingOffset *getFoldingOffset; | |
261 const CheckRange *enumRanges; | |
262 UNewTrie *newTrie; | |
263 UTrie trie={ 0 }; | |
264 uint32_t value, value2; | |
265 UChar32 start, limit; | |
266 int32_t i, length; | |
267 UErrorCode errorCode; | |
268 UBool overwrite, ok; | |
269 uint8_t* storage =NULL; | |
270 static const int32_t DEFAULT_STORAGE_SIZE = 32768; | |
271 storage = (uint8_t*) uprv_malloc(sizeof(uint8_t)*DEFAULT_STORAGE_SIZE); | |
272 | |
273 log_verbose("\ntesting Trie '%s'\n", testName); | |
274 newTrie=utrie_open(NULL, NULL, 2000, | |
275 checkRanges[0].value, checkRanges[0].value, | |
276 latin1Linear); | |
277 | |
278 /* set values from setRanges[] */ | |
279 ok=TRUE; | |
280 for(i=0; i<countSetRanges; ++i) { | |
281 start=setRanges[i].start; | |
282 limit=setRanges[i].limit; | |
283 value=setRanges[i].value; | |
284 overwrite=setRanges[i].overwrite; | |
285 if((limit-start)==1 && overwrite) { | |
286 ok&=utrie_set32(newTrie, start, value); | |
287 } else { | |
288 ok&=utrie_setRange32(newTrie, start, limit, value, overwrite); | |
289 } | |
290 } | |
291 if(!ok) { | |
292 log_err("error: setting values into a trie failed (%s)\n", testName); | |
293 return; | |
294 } | |
295 | |
296 /* verify that all these values are in the new Trie */ | |
297 start=0; | |
298 for(i=0; i<countCheckRanges; ++i) { | |
299 limit=checkRanges[i].limit; | |
300 value=checkRanges[i].value; | |
301 | |
302 while(start<limit) { | |
303 if(value!=utrie_get32(newTrie, start, NULL)) { | |
304 log_err("error: newTrie(%s)[U+%04lx]==0x%lx instead of 0x%lx\n", | |
305 testName, start, utrie_get32(newTrie, start, NULL), valu
e); | |
306 } | |
307 ++start; | |
308 } | |
309 } | |
310 | |
311 if(dataIs32) { | |
312 getFoldingOffset=_testFoldingOffset32; | |
313 } else { | |
314 getFoldingOffset=_testFoldingOffset16; | |
315 } | |
316 | |
317 errorCode=U_ZERO_ERROR; | |
318 length=utrie_serialize(newTrie, storage, DEFAULT_STORAGE_SIZE, | |
319 dataIs32 ? _testFoldedValue32 : _testFoldedValue16, | |
320 (UBool)!dataIs32, | |
321 &errorCode); | |
322 if(U_FAILURE(errorCode)) { | |
323 log_err("error: utrie_serialize(%s) failed: %s\n", testName, u_errorName
(errorCode)); | |
324 utrie_close(newTrie); | |
325 return; | |
326 } | |
327 | |
328 /* test linear Latin-1 range from utrie_getData() */ | |
329 if(latin1Linear) { | |
330 uint32_t *data; | |
331 int32_t dataLength; | |
332 | |
333 data=utrie_getData(newTrie, &dataLength); | |
334 start=0; | |
335 for(i=0; i<countCheckRanges && start<=0xff; ++i) { | |
336 limit=checkRanges[i].limit; | |
337 value=checkRanges[i].value; | |
338 | |
339 while(start<limit && start<=0xff) { | |
340 if(value!=data[UTRIE_DATA_BLOCK_LENGTH+start]) { | |
341 log_err("error: newTrie(%s).latin1Data[U+%04lx]==0x%lx inste
ad of 0x%lx\n", | |
342 testName, start, data[UTRIE_DATA_BLOCK_LENGTH+start]
, value); | |
343 } | |
344 ++start; | |
345 } | |
346 } | |
347 } | |
348 | |
349 utrie_close(newTrie); | |
350 | |
351 errorCode=U_ZERO_ERROR; | |
352 if(!utrie_unserialize(&trie, storage, length, &errorCode)) { | |
353 log_err("error: utrie_unserialize() failed, %s\n", u_errorName(errorCode
)); | |
354 return; | |
355 } | |
356 trie.getFoldingOffset=getFoldingOffset; | |
357 | |
358 if(dataIs32!=(trie.data32!=NULL)) { | |
359 log_err("error: trie serialization (%s) did not preserve 32-bitness\n",
testName); | |
360 } | |
361 if(latin1Linear!=trie.isLatin1Linear) { | |
362 log_err("error: trie serialization (%s) did not preserve Latin-1-lineari
ty\n", testName); | |
363 } | |
364 | |
365 /* verify that all these values are in the unserialized Trie */ | |
366 start=0; | |
367 for(i=0; i<countCheckRanges; ++i) { | |
368 limit=checkRanges[i].limit; | |
369 value=checkRanges[i].value; | |
370 | |
371 if(start==0xd800) { | |
372 /* skip surrogates */ | |
373 start=limit; | |
374 continue; | |
375 } | |
376 | |
377 while(start<limit) { | |
378 if(start<=0xffff) { | |
379 if(dataIs32) { | |
380 value2=UTRIE_GET32_FROM_BMP(&trie, start); | |
381 } else { | |
382 value2=UTRIE_GET16_FROM_BMP(&trie, start); | |
383 } | |
384 if(value!=value2) { | |
385 log_err("error: unserialized trie(%s).fromBMP(U+%04lx)==0x%l
x instead of 0x%lx\n", | |
386 testName, start, value2, value); | |
387 } | |
388 if(!U16_IS_LEAD(start)) { | |
389 if(dataIs32) { | |
390 value2=UTRIE_GET32_FROM_LEAD(&trie, start); | |
391 } else { | |
392 value2=UTRIE_GET16_FROM_LEAD(&trie, start); | |
393 } | |
394 if(value!=value2) { | |
395 log_err("error: unserialized trie(%s).fromLead(U+%04lx)=
=0x%lx instead of 0x%lx\n", | |
396 testName, start, value2, value); | |
397 } | |
398 } | |
399 } | |
400 if(dataIs32) { | |
401 UTRIE_GET32(&trie, start, value2); | |
402 } else { | |
403 UTRIE_GET16(&trie, start, value2); | |
404 } | |
405 if(value!=value2) { | |
406 log_err("error: unserialized trie(%s).get(U+%04lx)==0x%lx instea
d of 0x%lx\n", | |
407 testName, start, value2, value); | |
408 } | |
409 ++start; | |
410 } | |
411 } | |
412 | |
413 /* enumerate and verify all ranges */ | |
414 enumRanges=checkRanges+1; | |
415 utrie_enum(&trie, _testEnumValue, _testEnumRange, &enumRanges); | |
416 | |
417 /* test linear Latin-1 range */ | |
418 if(trie.isLatin1Linear) { | |
419 if(trie.data32!=NULL) { | |
420 const uint32_t *latin1=UTRIE_GET32_LATIN1(&trie); | |
421 | |
422 for(start=0; start<0x100; ++start) { | |
423 if(latin1[start]!=UTRIE_GET32_FROM_LEAD(&trie, start)) { | |
424 log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.
get32(U+%04lx)\n", | |
425 testName, start, latin1[start], UTRIE_GET32_FROM_LEA
D(&trie, start), start); | |
426 } | |
427 } | |
428 } else { | |
429 const uint16_t *latin1=UTRIE_GET16_LATIN1(&trie); | |
430 | |
431 for(start=0; start<0x100; ++start) { | |
432 if(latin1[start]!=UTRIE_GET16_FROM_LEAD(&trie, start)) { | |
433 log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.
get16(U+%04lx)\n", | |
434 testName, start, latin1[start], UTRIE_GET16_FROM_LEA
D(&trie, start), start); | |
435 } | |
436 } | |
437 } | |
438 } | |
439 | |
440 testTrieIteration(testName, &trie, checkRanges, countCheckRanges); | |
441 uprv_free(storage); | |
442 } | |
443 | |
444 static void | |
445 testTrieRanges(const char *testName, | |
446 const SetRange setRanges[], int32_t countSetRanges, | |
447 const CheckRange checkRanges[], int32_t countCheckRanges, | |
448 UBool dataIs32, UBool latin1Linear) { | |
449 union{ | |
450 double bogus; /* needed for aligining the storage */ | |
451 uint8_t storage[32768]; | |
452 } storageHolder; | |
453 UTrieGetFoldingOffset *getFoldingOffset; | |
454 UNewTrieGetFoldedValue *getFoldedValue; | |
455 const CheckRange *enumRanges; | |
456 UNewTrie *newTrie; | |
457 UTrie trie={ 0 }; | |
458 uint32_t value, value2; | |
459 UChar32 start, limit; | |
460 int32_t i, length; | |
461 UErrorCode errorCode; | |
462 UBool overwrite, ok; | |
463 | |
464 log_verbose("\ntesting Trie '%s'\n", testName); | |
465 newTrie=utrie_open(NULL, NULL, 2000, | |
466 checkRanges[0].value, checkRanges[0].value, | |
467 latin1Linear); | |
468 | |
469 /* set values from setRanges[] */ | |
470 ok=TRUE; | |
471 for(i=0; i<countSetRanges; ++i) { | |
472 start=setRanges[i].start; | |
473 limit=setRanges[i].limit; | |
474 value=setRanges[i].value; | |
475 overwrite=setRanges[i].overwrite; | |
476 if((limit-start)==1 && overwrite) { | |
477 ok&=utrie_set32(newTrie, start, value); | |
478 } else { | |
479 ok&=utrie_setRange32(newTrie, start, limit, value, overwrite); | |
480 } | |
481 } | |
482 if(!ok) { | |
483 log_err("error: setting values into a trie failed (%s)\n", testName); | |
484 return; | |
485 } | |
486 | |
487 /* verify that all these values are in the new Trie */ | |
488 start=0; | |
489 for(i=0; i<countCheckRanges; ++i) { | |
490 limit=checkRanges[i].limit; | |
491 value=checkRanges[i].value; | |
492 | |
493 while(start<limit) { | |
494 if(value!=utrie_get32(newTrie, start, NULL)) { | |
495 log_err("error: newTrie(%s)[U+%04lx]==0x%lx instead of 0x%lx\n", | |
496 testName, start, utrie_get32(newTrie, start, NULL), valu
e); | |
497 } | |
498 ++start; | |
499 } | |
500 } | |
501 | |
502 if(dataIs32) { | |
503 getFoldingOffset=_testFoldingOffset32; | |
504 getFoldedValue=_testFoldedValue32; | |
505 } else { | |
506 getFoldingOffset=_testFoldingOffset16; | |
507 getFoldedValue=_testFoldedValue16; | |
508 } | |
509 | |
510 /* | |
511 * code coverage for utrie.c/defaultGetFoldedValue(), | |
512 * pick some combination of parameters for selecting the UTrie defaults | |
513 */ | |
514 if(!dataIs32 && latin1Linear) { | |
515 getFoldingOffset=NULL; | |
516 getFoldedValue=NULL; | |
517 } | |
518 | |
519 errorCode=U_ZERO_ERROR; | |
520 length=utrie_serialize(newTrie, storageHolder.storage, sizeof(storageHolder.
storage), | |
521 getFoldedValue, | |
522 (UBool)!dataIs32, | |
523 &errorCode); | |
524 if(U_FAILURE(errorCode)) { | |
525 log_err("error: utrie_serialize(%s) failed: %s\n", testName, u_errorName
(errorCode)); | |
526 utrie_close(newTrie); | |
527 return; | |
528 } | |
529 if (length >= (int32_t)sizeof(storageHolder.storage)) { | |
530 log_err("error: utrie_serialize(%s) needs more memory\n", testName); | |
531 utrie_close(newTrie); | |
532 return; | |
533 } | |
534 | |
535 /* test linear Latin-1 range from utrie_getData() */ | |
536 if(latin1Linear) { | |
537 uint32_t *data; | |
538 int32_t dataLength; | |
539 | |
540 data=utrie_getData(newTrie, &dataLength); | |
541 start=0; | |
542 for(i=0; i<countCheckRanges && start<=0xff; ++i) { | |
543 limit=checkRanges[i].limit; | |
544 value=checkRanges[i].value; | |
545 | |
546 while(start<limit && start<=0xff) { | |
547 if(value!=data[UTRIE_DATA_BLOCK_LENGTH+start]) { | |
548 log_err("error: newTrie(%s).latin1Data[U+%04lx]==0x%lx inste
ad of 0x%lx\n", | |
549 testName, start, data[UTRIE_DATA_BLOCK_LENGTH+start]
, value); | |
550 } | |
551 ++start; | |
552 } | |
553 } | |
554 } | |
555 | |
556 utrie_close(newTrie); | |
557 | |
558 errorCode=U_ZERO_ERROR; | |
559 if(!utrie_unserialize(&trie, storageHolder.storage, length, &errorCode)) { | |
560 log_err("error: utrie_unserialize() failed, %s\n", u_errorName(errorCode
)); | |
561 return; | |
562 } | |
563 if(getFoldingOffset!=NULL) { | |
564 trie.getFoldingOffset=getFoldingOffset; | |
565 } | |
566 | |
567 if(dataIs32!=(trie.data32!=NULL)) { | |
568 log_err("error: trie serialization (%s) did not preserve 32-bitness\n",
testName); | |
569 } | |
570 if(latin1Linear!=trie.isLatin1Linear) { | |
571 log_err("error: trie serialization (%s) did not preserve Latin-1-lineari
ty\n", testName); | |
572 } | |
573 | |
574 /* verify that all these values are in the unserialized Trie */ | |
575 start=0; | |
576 for(i=0; i<countCheckRanges; ++i) { | |
577 limit=checkRanges[i].limit; | |
578 value=checkRanges[i].value; | |
579 | |
580 if(start==0xd800) { | |
581 /* skip surrogates */ | |
582 start=limit; | |
583 continue; | |
584 } | |
585 | |
586 while(start<limit) { | |
587 if(start<=0xffff) { | |
588 if(dataIs32) { | |
589 value2=UTRIE_GET32_FROM_BMP(&trie, start); | |
590 } else { | |
591 value2=UTRIE_GET16_FROM_BMP(&trie, start); | |
592 } | |
593 if(value!=value2) { | |
594 log_err("error: unserialized trie(%s).fromBMP(U+%04lx)==0x%l
x instead of 0x%lx\n", | |
595 testName, start, value2, value); | |
596 } | |
597 if(!U16_IS_LEAD(start)) { | |
598 if(dataIs32) { | |
599 value2=UTRIE_GET32_FROM_LEAD(&trie, start); | |
600 } else { | |
601 value2=UTRIE_GET16_FROM_LEAD(&trie, start); | |
602 } | |
603 if(value!=value2) { | |
604 log_err("error: unserialized trie(%s).fromLead(U+%04lx)=
=0x%lx instead of 0x%lx\n", | |
605 testName, start, value2, value); | |
606 } | |
607 } | |
608 } | |
609 if(dataIs32) { | |
610 UTRIE_GET32(&trie, start, value2); | |
611 } else { | |
612 UTRIE_GET16(&trie, start, value2); | |
613 } | |
614 if(value!=value2) { | |
615 log_err("error: unserialized trie(%s).get(U+%04lx)==0x%lx instea
d of 0x%lx\n", | |
616 testName, start, value2, value); | |
617 } | |
618 ++start; | |
619 } | |
620 } | |
621 | |
622 /* enumerate and verify all ranges */ | |
623 enumRanges=checkRanges+1; | |
624 utrie_enum(&trie, _testEnumValue, _testEnumRange, &enumRanges); | |
625 | |
626 /* test linear Latin-1 range */ | |
627 if(trie.isLatin1Linear) { | |
628 if(trie.data32!=NULL) { | |
629 const uint32_t *latin1=UTRIE_GET32_LATIN1(&trie); | |
630 | |
631 for(start=0; start<0x100; ++start) { | |
632 if(latin1[start]!=UTRIE_GET32_FROM_LEAD(&trie, start)) { | |
633 log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.
get32(U+%04lx)\n", | |
634 testName, start, latin1[start], UTRIE_GET32_FROM_LEA
D(&trie, start), start); | |
635 } | |
636 } | |
637 } else { | |
638 const uint16_t *latin1=UTRIE_GET16_LATIN1(&trie); | |
639 | |
640 for(start=0; start<0x100; ++start) { | |
641 if(latin1[start]!=UTRIE_GET16_FROM_LEAD(&trie, start)) { | |
642 log_err("error: (%s) trie.latin1[U+%04lx]=0x%lx!=0x%lx=trie.
get16(U+%04lx)\n", | |
643 testName, start, latin1[start], UTRIE_GET16_FROM_LEA
D(&trie, start), start); | |
644 } | |
645 } | |
646 } | |
647 } | |
648 | |
649 testTrieIteration(testName, &trie, checkRanges, countCheckRanges); | |
650 } | |
651 | |
652 static void | |
653 testTrieRanges2(const char *testName, | |
654 const SetRange setRanges[], int32_t countSetRanges, | |
655 const CheckRange checkRanges[], int32_t countCheckRanges, | |
656 UBool dataIs32) { | |
657 char name[40]; | |
658 | |
659 testTrieRanges(testName, | |
660 setRanges, countSetRanges, | |
661 checkRanges, countCheckRanges, | |
662 dataIs32, FALSE); | |
663 testTrieRangesWithMalloc(testName, | |
664 setRanges, countSetRanges, | |
665 checkRanges, countCheckRanges, | |
666 dataIs32, FALSE); | |
667 | |
668 uprv_strcpy(name, testName); | |
669 uprv_strcat(name, "-latin1Linear"); | |
670 testTrieRanges(name, | |
671 setRanges, countSetRanges, | |
672 checkRanges, countCheckRanges, | |
673 dataIs32, TRUE); | |
674 testTrieRangesWithMalloc(name, | |
675 setRanges, countSetRanges, | |
676 checkRanges, countCheckRanges, | |
677 dataIs32, TRUE); | |
678 } | |
679 | |
680 static void | |
681 testTrieRanges4(const char *testName, | |
682 const SetRange setRanges[], int32_t countSetRanges, | |
683 const CheckRange checkRanges[], int32_t countCheckRanges) { | |
684 char name[40]; | |
685 | |
686 uprv_strcpy(name, testName); | |
687 uprv_strcat(name, ".32"); | |
688 testTrieRanges2(name, | |
689 setRanges, countSetRanges, | |
690 checkRanges, countCheckRanges, | |
691 TRUE); | |
692 | |
693 uprv_strcpy(name, testName); | |
694 uprv_strcat(name, ".16"); | |
695 testTrieRanges2(name, | |
696 setRanges, countSetRanges, | |
697 checkRanges, countCheckRanges, | |
698 FALSE); | |
699 } | |
700 | |
701 /* test data ----------------------------------------------------------------*/ | |
702 | |
703 /* set consecutive ranges, even with value 0 */ | |
704 static const SetRange | |
705 setRanges1[]={ | |
706 {0, 0x20, 0, FALSE}, | |
707 {0x20, 0xa7, 0x1234, FALSE}, | |
708 {0xa7, 0x3400, 0, FALSE}, | |
709 {0x3400, 0x9fa6, 0x6162, FALSE}, | |
710 {0x9fa6, 0xda9e, 0x3132, FALSE}, | |
711 {0xdada, 0xeeee, 0x87ff, FALSE}, /* try to disrupt _testFoldingOffset16(
) */ | |
712 {0xeeee, 0x11111, 1, FALSE}, | |
713 {0x11111, 0x44444, 0x6162, FALSE}, | |
714 {0x44444, 0x60003, 0, FALSE}, | |
715 {0xf0003, 0xf0004, 0xf, FALSE}, | |
716 {0xf0004, 0xf0006, 0x10, FALSE}, | |
717 {0xf0006, 0xf0007, 0x11, FALSE}, | |
718 {0xf0007, 0xf0020, 0x12, FALSE}, | |
719 {0xf0020, 0x110000, 0, FALSE} | |
720 }; | |
721 | |
722 static const CheckRange | |
723 checkRanges1[]={ | |
724 {0, 0}, /* dummy start range to make _testEnumRange() simpler */ | |
725 {0x20, 0}, | |
726 {0xa7, 0x1234}, | |
727 {0x3400, 0}, | |
728 {0x9fa6, 0x6162}, | |
729 {0xda9e, 0x3132}, | |
730 {0xdada, 0}, | |
731 {0xeeee, 0x87ff}, | |
732 {0x11111,1}, | |
733 {0x44444,0x6162}, | |
734 {0xf0003,0}, | |
735 {0xf0004,0xf}, | |
736 {0xf0006,0x10}, | |
737 {0xf0007,0x11}, | |
738 {0xf0020,0x12}, | |
739 {0x110000, 0} | |
740 }; | |
741 | |
742 /* set some interesting overlapping ranges */ | |
743 static const SetRange | |
744 setRanges2[]={ | |
745 {0x21, 0x7f, 0x5555, TRUE}, | |
746 {0x2f800,0x2fedc, 0x7a, TRUE}, | |
747 {0x72, 0xdd, 3, TRUE}, | |
748 {0xdd, 0xde, 4, FALSE}, | |
749 {0x201, 0x220, 6, TRUE}, /* 3 consecutive blocks with the same p
attern but discontiguous value ranges */ | |
750 {0x221, 0x240, 6, TRUE}, | |
751 {0x241, 0x260, 6, TRUE}, | |
752 {0x2f987,0x2fa98, 5, TRUE}, | |
753 {0x2f777,0x2f833, 0, TRUE}, | |
754 {0x2f900,0x2ffee, 1, FALSE}, | |
755 {0x2ffee,0x2ffef, 2, TRUE} | |
756 }; | |
757 | |
758 static const CheckRange | |
759 checkRanges2[]={ | |
760 {0, 0}, /* dummy start range to make _testEnumRange() simpler */ | |
761 {0x21, 0}, | |
762 {0x72, 0x5555}, | |
763 {0xdd, 3}, | |
764 {0xde, 4}, | |
765 {0x201, 0}, | |
766 {0x220, 6}, | |
767 {0x221, 0}, | |
768 {0x240, 6}, | |
769 {0x241, 0}, | |
770 {0x260, 6}, | |
771 {0x2f833,0}, | |
772 {0x2f987,0x7a}, | |
773 {0x2fa98,5}, | |
774 {0x2fedc,0x7a}, | |
775 {0x2ffee,1}, | |
776 {0x2ffef,2}, | |
777 {0x110000, 0} | |
778 }; | |
779 | |
780 /* use a non-zero initial value */ | |
781 static const SetRange | |
782 setRanges3[]={ | |
783 {0x31, 0xa4, 1, FALSE}, | |
784 {0x3400, 0x6789, 2, FALSE}, | |
785 {0x30000,0x34567,9, TRUE}, | |
786 {0x45678,0x56789,3, TRUE} | |
787 }; | |
788 | |
789 static const CheckRange | |
790 checkRanges3[]={ | |
791 {0, 9}, /* dummy start range, also carries the initial value */ | |
792 {0x31, 9}, | |
793 {0xa4, 1}, | |
794 {0x3400, 9}, | |
795 {0x6789, 2}, | |
796 {0x45678,9}, | |
797 {0x56789,3}, | |
798 {0x110000,9} | |
799 }; | |
800 | |
801 static void | |
802 TrieTest(void) { | |
803 testTrieRanges4("set1", | |
804 setRanges1, ARRAY_LENGTH(setRanges1), | |
805 checkRanges1, ARRAY_LENGTH(checkRanges1)); | |
806 testTrieRanges4("set2-overlap", | |
807 setRanges2, ARRAY_LENGTH(setRanges2), | |
808 checkRanges2, ARRAY_LENGTH(checkRanges2)); | |
809 testTrieRanges4("set3-initial-9", | |
810 setRanges3, ARRAY_LENGTH(setRanges3), | |
811 checkRanges3, ARRAY_LENGTH(checkRanges3)); | |
812 } | |
813 | |
814 /* test utrie_unserializeDummy() -------------------------------------------- */ | |
815 | |
816 static int32_t U_CALLCONV | |
817 dummyGetFoldingOffset(uint32_t data) { | |
818 return -1; /* never get non-initialValue data for supplementary code points
*/ | |
819 } | |
820 | |
821 static void | |
822 dummyTest(UBool make16BitTrie) { | |
823 int32_t mem[UTRIE_DUMMY_SIZE/4]; | |
824 | |
825 UTrie trie; | |
826 UErrorCode errorCode; | |
827 UChar32 c; | |
828 | |
829 uint32_t value, initialValue, leadUnitValue; | |
830 | |
831 if(make16BitTrie) { | |
832 initialValue=0x313; | |
833 leadUnitValue=0xaffe; | |
834 } else { | |
835 initialValue=0x01234567; | |
836 leadUnitValue=0x89abcdef; | |
837 } | |
838 | |
839 errorCode=U_ZERO_ERROR; | |
840 utrie_unserializeDummy(&trie, mem, sizeof(mem), initialValue, leadUnitValue,
make16BitTrie, &errorCode); | |
841 if(U_FAILURE(errorCode)) { | |
842 log_err("utrie_unserializeDummy(make16BitTrie=%d) failed - %s\n", make16
BitTrie, u_errorName(errorCode)); | |
843 return; | |
844 } | |
845 trie.getFoldingOffset=dummyGetFoldingOffset; | |
846 | |
847 /* test that all code points have initialValue */ | |
848 for(c=0; c<=0x10ffff; ++c) { | |
849 if(make16BitTrie) { | |
850 UTRIE_GET16(&trie, c, value); | |
851 } else { | |
852 UTRIE_GET32(&trie, c, value); | |
853 } | |
854 if(value!=initialValue) { | |
855 log_err("UTRIE_GET%s(dummy, U+%04lx)=0x%lx instead of 0x%lx\n", | |
856 make16BitTrie ? "16" : "32", (long)c, (long)value, (long)initial
Value); | |
857 } | |
858 } | |
859 | |
860 /* test that the lead surrogate code units have leadUnitValue */ | |
861 for(c=0xd800; c<=0xdbff; ++c) { | |
862 if(make16BitTrie) { | |
863 value=UTRIE_GET16_FROM_LEAD(&trie, c); | |
864 } else { | |
865 value=UTRIE_GET32_FROM_LEAD(&trie, c); | |
866 } | |
867 if(value!=leadUnitValue) { | |
868 log_err("UTRIE_GET%s_FROM_LEAD(dummy, U+%04lx)=0x%lx instead of 0x%l
x\n", | |
869 make16BitTrie ? "16" : "32", (long)c, (long)value, (long)leadUni
tValue); | |
870 } | |
871 } | |
872 } | |
873 | |
874 static void | |
875 DummyTrieTest(void) { | |
876 dummyTest(TRUE); | |
877 dummyTest(FALSE); | |
878 } | |
879 | |
880 void | |
881 addTrieTest(TestNode** root); | |
882 | |
883 void | |
884 addTrieTest(TestNode** root) { | |
885 addTest(root, &TrieTest, "tsutil/trietest/TrieTest"); | |
886 addTest(root, &DummyTrieTest, "tsutil/trietest/DummyTrieTest"); | |
887 } | |
OLD | NEW |