OLD | NEW |
| (Empty) |
1 /******************************************************************** | |
2 * COPYRIGHT: | |
3 * Copyright (C) 2001-2012 IBM, Inc. All Rights Reserved. | |
4 * | |
5 ********************************************************************/ | |
6 | |
7 #include <stdio.h> | |
8 #include <stdlib.h> | |
9 #include <locale.h> | |
10 #include <limits.h> | |
11 #include <string.h> | |
12 #include "unicode/uperf.h" | |
13 #include "uoptions.h" | |
14 #include "unicode/coll.h" | |
15 #include <unicode/ucoleitr.h> | |
16 | |
// When the Win32 API is not available, define stand-ins for the two Windows
// type names that the shared (non-Windows-specific) declarations below use.
#if !U_PLATFORM_HAS_WIN32_API
#define DWORD uint32_t
#define WCHAR wchar_t
#endif
21 | |
/* Stores an array of string<UNIT> in one contiguous buffer.
   Since a string<UNIT> is itself an array of UNIT, keeping all strings
   back-to-back in a single allocation eases memory management.

   COMPATCT_ARRAY(Name, UNIT) defines a struct Name with:
     count        number of strings stored
     index        count + 1 offsets into data; string i occupies
                  [index[i], index[i + 1]) including its terminator
     data         the backing buffer
     append_one   reserves room for one more string of theLen units
                  (theLen includes the terminator); may move data, so
                  previously obtained pointers become invalid
     last         pointer to the most recently appended string
     dataOf       pointer to string i
     lengthOf     length of string i, excluding the terminator

   The copy constructor and copy assignment are declared but not defined,
   so instances cannot be copied. Running out of memory is reported on
   stderr and terminates the process.
*/

//template<typename UNIT>
#define COMPATCT_ARRAY(CompactArrays, UNIT) \
struct CompactArrays{\
    CompactArrays(const CompactArrays & );\
    CompactArrays & operator=(const CompactArrays & );\
    int32_t count;/*total number of the strings*/ \
    int32_t * index;/*relative offset in data*/ \
    UNIT * data; /*the real space to hold strings*/ \
    \
    /* realloc wrapper: a failed non-empty request is fatal */ \
    static void * grow(void * block, size_t bytes){ \
        void * moved = realloc(block, bytes); \
        if (moved == NULL && bytes != 0) { \
            fprintf(stderr, "CompactArrays: out of memory\n"); \
            exit(-1); \
        } \
        return moved; \
    } \
    ~CompactArrays(){free(index);free(data);} \
    /* initializers listed in declaration order */ \
    CompactArrays():count(0), index(NULL), data(NULL){ \
        index = (int32_t *) grow(NULL, sizeof(int32_t)); \
        index[0] = 0; \
    } \
    void append_one(int32_t theLen){ /*include terminal NULL*/ \
        count++; \
        index = (int32_t *) grow(index, sizeof(int32_t) * (count + 1)); \
        index[count] = index[count - 1] + theLen; \
        data = (UNIT *) grow(data, sizeof(UNIT) * index[count]); \
    } \
    UNIT * last(){return data + index[count - 1];} \
    UNIT * dataOf(int32_t i){return data + index[i];} \
    int32_t lengthOf(int i){return index[i+1] - index[i] - 1; } /*exclude terminating NULL*/ \
};
51 | |
52 //typedef CompactArrays<UChar> CA_uchar; | |
53 //typedef CompactArrays<char> CA_char; | |
54 //typedef CompactArrays<uint8_t> CA_uint8; | |
55 //typedef CompactArrays<WCHAR> CA_win_wchar; | |
56 | |
// Instantiate one compact string container per code-unit type used below.
COMPATCT_ARRAY(CA_uchar, UChar)
COMPATCT_ARRAY(CA_char, char)
COMPATCT_ARRAY(CA_uint8, uint8_t)
COMPATCT_ARRAY(CA_win_wchar, WCHAR)
61 | |
62 | |
// One record per test string. It holds pointers to the same string in its
// ICU, POSIX and Windows representations together with the matching
// pre-generated sort keys. The pointers are assigned in
// CollPerfTest::prepareData() and refer to storage owned by the CA_*
// containers; the record itself owns nothing.
struct DataIndex {
    // The qsort() comparison callbacks receive only the two elements, so the
    // collator and the Windows language id are shared through static members.
    static DWORD win_langid; // for qsort callback function
    static UCollator * col; // for qsort callback function
    uint8_t * icu_key;       // ICU sort key
    UChar * icu_data;        // text as UChar
    int32_t icu_data_len;    // length of icu_data
    char* posix_key;         // strxfrm() result
    char* posix_data;        // text converted with the "utf-8" converter
    int32_t posix_data_len;  // length of posix_data
    char* win_key;           // LCMapStringW(LCMAP_SORTKEY) result (Win32 builds only)
    WCHAR * win_data;        // text as WCHAR (Win32 builds only)
    int32_t win_data_len;    // length of win_data
};
// Storage for the static members declared above.
DWORD DataIndex::win_langid;
UCollator * DataIndex::col;
78 | |
79 | |
80 | |
81 class CmdKeyGen : public UPerfFunction { | |
82 typedef void (CmdKeyGen::* Func)(int32_t); | |
83 enum{MAX_KEY_LENGTH = 5000}; | |
84 UCollator * col; | |
85 DWORD win_langid; | |
86 int32_t count; | |
87 DataIndex * data; | |
88 Func fn; | |
89 | |
90 union { // to save sapce | |
91 uint8_t icu_key[MAX_KEY_LENGTH]; | |
92 char posix_key[MAX_KEY_LENGTH]; | |
93 WCHAR win_key[MAX_KEY_LENGTH]; | |
94 }; | |
95 public: | |
96 CmdKeyGen(UErrorCode, UCollator * col,DWORD win_langid, int32_t count, DataI
ndex * data,Func fn,int32_t) | |
97 :col(col),win_langid(win_langid), count(count), data(data), fn(fn){} | |
98 | |
99 virtual long getOperationsPerIteration(){return count;} | |
100 | |
101 virtual void call(UErrorCode* status){ | |
102 for(int32_t i = 0; i< count; i++){ | |
103 (this->*fn)(i); | |
104 } | |
105 } | |
106 | |
107 void icu_key_null(int32_t i){ | |
108 ucol_getSortKey(col, data[i].icu_data, -1, icu_key, MAX_KEY_LENGTH); | |
109 } | |
110 | |
111 void icu_key_len(int32_t i){ | |
112 ucol_getSortKey(col, data[i].icu_data, data[i].icu_data_len, icu_key
, MAX_KEY_LENGTH); | |
113 } | |
114 | |
115 #if U_PLATFORM_HAS_WIN32_API | |
116 // pre-generated in CollPerfTest::prepareData(), need not to check error
here | |
117 void win_key_null(int32_t i){ | |
118 //LCMAP_SORTsk 0x00000400 // WC sort sk (normalize) | |
119 LCMapStringW(win_langid, LCMAP_SORTKEY, data[i].win_data, -1, win_ke
y, MAX_KEY_LENGTH); | |
120 } | |
121 | |
122 void win_key_len(int32_t i){ | |
123 LCMapStringW(win_langid, LCMAP_SORTKEY, data[i].win_data, data[i].wi
n_data_len, win_key, MAX_KEY_LENGTH); | |
124 } | |
125 #endif | |
126 | |
127 void posix_key_null(int32_t i){ | |
128 strxfrm(posix_key, data[i].posix_data, MAX_KEY_LENGTH); | |
129 } | |
130 }; | |
131 | |
132 | |
133 class CmdIter : public UPerfFunction { | |
134 typedef void (CmdIter::* Func)(UErrorCode* , int32_t ); | |
135 int32_t count; | |
136 CA_uchar * data; | |
137 Func fn; | |
138 UCollationElements *iter; | |
139 int32_t exec_count; | |
140 public: | |
141 CmdIter(UErrorCode & status, UCollator * col, int32_t count, CA_uchar *data,
Func fn, int32_t,int32_t) | |
142 :count(count), data(data), fn(fn){ | |
143 exec_count = 0; | |
144 UChar dummytext[] = {0, 0}; | |
145 iter = ucol_openElements(col, NULL, 0, &status); | |
146 ucol_setText(iter, dummytext, 1, &status); | |
147 } | |
148 ~CmdIter(){ | |
149 ucol_closeElements(iter); | |
150 } | |
151 | |
152 virtual long getOperationsPerIteration(){return exec_count ? exec_count
: 1;} | |
153 | |
154 virtual void call(UErrorCode* status){ | |
155 exec_count = 0; | |
156 for(int32_t i = 0; i< count; i++){ | |
157 (this->*fn)(status, i); | |
158 } | |
159 } | |
160 | |
161 void icu_forward_null(UErrorCode* status, int32_t i){ | |
162 ucol_setText(iter, data->dataOf(i), -1, status); | |
163 while (ucol_next(iter, status) != UCOL_NULLORDER) exec_count++; | |
164 } | |
165 | |
166 void icu_forward_len(UErrorCode* status, int32_t i){ | |
167 ucol_setText(iter, data->dataOf(i), data->lengthOf(i) , status); | |
168 while (ucol_next(iter, status) != UCOL_NULLORDER) exec_count++; | |
169 } | |
170 | |
171 void icu_backward_null(UErrorCode* status, int32_t i){ | |
172 ucol_setText(iter, data->dataOf(i), -1, status); | |
173 while (ucol_previous(iter, status) != UCOL_NULLORDER) exec_count++; | |
174 } | |
175 | |
176 void icu_backward_len(UErrorCode* status, int32_t i){ | |
177 ucol_setText(iter, data->dataOf(i), data->lengthOf(i) , status); | |
178 while (ucol_previous(iter, status) != UCOL_NULLORDER) exec_count++; | |
179 } | |
180 }; | |
181 | |
182 class CmdIterAll : public UPerfFunction { | |
183 typedef void (CmdIterAll::* Func)(UErrorCode* status); | |
184 int32_t count; | |
185 UChar * data; | |
186 Func fn; | |
187 UCollationElements *iter; | |
188 int32_t exec_count; | |
189 | |
190 public: | |
191 enum CALL {forward_null, forward_len, backward_null, backward_len}; | |
192 | |
193 ~CmdIterAll(){ | |
194 ucol_closeElements(iter); | |
195 } | |
196 CmdIterAll(UErrorCode & status, UCollator * col, int32_t count, UChar * dat
a, CALL call,int32_t,int32_t) | |
197 :count(count),data(data) | |
198 { | |
199 exec_count = 0; | |
200 if (call == forward_null || call == backward_null) { | |
201 iter = ucol_openElements(col, data, -1, &status); | |
202 } else { | |
203 iter = ucol_openElements(col, data, count, &status); | |
204 } | |
205 | |
206 if (call == forward_null || call == forward_len){ | |
207 fn = &CmdIterAll::icu_forward_all; | |
208 } else { | |
209 fn = &CmdIterAll::icu_backward_all; | |
210 } | |
211 } | |
212 virtual long getOperationsPerIteration(){return exec_count ? exec_count : 1;
} | |
213 | |
214 virtual void call(UErrorCode* status){ | |
215 (this->*fn)(status); | |
216 } | |
217 | |
218 void icu_forward_all(UErrorCode* status){ | |
219 int strlen = count - 5; | |
220 int count5 = 5; | |
221 int strindex = 0; | |
222 ucol_setOffset(iter, strindex, status); | |
223 while (TRUE) { | |
224 if (ucol_next(iter, status) == UCOL_NULLORDER) { | |
225 break; | |
226 } | |
227 exec_count++; | |
228 count5 --; | |
229 if (count5 == 0) { | |
230 strindex += 10; | |
231 if (strindex > strlen) { | |
232 break; | |
233 } | |
234 ucol_setOffset(iter, strindex, status); | |
235 count5 = 5; | |
236 } | |
237 } | |
238 } | |
239 | |
240 void icu_backward_all(UErrorCode* status){ | |
241 int strlen = count; | |
242 int count5 = 5; | |
243 int strindex = 5; | |
244 ucol_setOffset(iter, strindex, status); | |
245 while (TRUE) { | |
246 if (ucol_previous(iter, status) == UCOL_NULLORDER) { | |
247 break; | |
248 } | |
249 exec_count++; | |
250 count5 --; | |
251 if (count5 == 0) { | |
252 strindex += 10; | |
253 if (strindex > strlen) { | |
254 break; | |
255 } | |
256 ucol_setOffset(iter, strindex, status); | |
257 count5 = 5; | |
258 } | |
259 } | |
260 } | |
261 | |
262 }; | |
263 | |
264 struct CmdQsort : public UPerfFunction{ | |
265 | |
266 static int q_random(const void * a, const void * b){ | |
267 uint8_t * key_a = ((DataIndex *)a)->icu_key; | |
268 uint8_t * key_b = ((DataIndex *)b)->icu_key; | |
269 | |
270 int val_a = 0; | |
271 int val_b = 0; | |
272 while (*key_a != 0) {val_a += val_a*37 + *key_a++;} | |
273 while (*key_b != 0) {val_b += val_b*37 + *key_b++;} | |
274 return val_a - val_b; | |
275 } | |
276 | |
277 #define QCAST() \ | |
278 DataIndex * da = (DataIndex *) a; \ | |
279 DataIndex * db = (DataIndex *) b; \ | |
280 ++exec_count | |
281 | |
282 static int icu_strcoll_null(const void *a, const void *b){ | |
283 QCAST(); | |
284 return ucol_strcoll(da->col, da->icu_data, -1, db->icu_data, -1) - UCOL_
EQUAL; | |
285 } | |
286 | |
287 static int icu_strcoll_len(const void *a, const void *b){ | |
288 QCAST(); | |
289 return ucol_strcoll(da->col, da->icu_data, da->icu_data_len, db->icu_dat
a, db->icu_data_len) - UCOL_EQUAL; | |
290 } | |
291 | |
292 static int icu_cmpkey (const void *a, const void *b){ | |
293 QCAST(); | |
294 return strcmp((char *) da->icu_key, (char *) db->icu_key); | |
295 } | |
296 | |
297 #if U_PLATFORM_HAS_WIN32_API | |
298 static int win_cmp_null(const void *a, const void *b) { | |
299 QCAST(); | |
300 //CSTR_LESS_THAN 1 | |
301 //CSTR_EQUAL 2 | |
302 //CSTR_GREATER_THAN 3 | |
303 int t = CompareStringW(da->win_langid, 0, da->win_data, -1, db->win_data
, -1); | |
304 if (t == 0){ | |
305 fprintf(stderr, "CompareStringW error, error number %x\n", GetLastEr
ror()); | |
306 exit(-1); | |
307 } else{ | |
308 return t - CSTR_EQUAL; | |
309 } | |
310 } | |
311 | |
312 static int win_cmp_len(const void *a, const void *b) { | |
313 QCAST(); | |
314 int t = CompareStringW(da->win_langid, 0, da->win_data, da->win_data_len
, db->win_data, db->win_data_len); | |
315 if (t == 0){ | |
316 fprintf(stderr, "CompareStringW error, error number %x\n", GetLastEr
ror()); | |
317 exit(-1); | |
318 } else{ | |
319 return t - CSTR_EQUAL; | |
320 } | |
321 } | |
322 #endif | |
323 | |
324 #define QFUNC(name, func, data) \ | |
325 static int name (const void *a, const void *b){ \ | |
326 QCAST(); \ | |
327 return func(da->data, db->data); \ | |
328 } | |
329 | |
330 QFUNC(posix_strcoll_null, strcoll, posix_data) | |
331 QFUNC(posix_cmpkey, strcmp, posix_key) | |
332 #if U_PLATFORM_HAS_WIN32_API | |
333 QFUNC(win_cmpkey, strcmp, win_key) | |
334 QFUNC(win_wcscmp, wcscmp, win_data) | |
335 #endif | |
336 QFUNC(icu_strcmp, u_strcmp, icu_data) | |
337 QFUNC(icu_cmpcpo, u_strcmpCodePointOrder, icu_data) | |
338 | |
339 private: | |
340 static int32_t exec_count; // potential muilt-thread problem | |
341 | |
342 typedef int (* Func)(const void *, const void *); | |
343 | |
344 Func fn; | |
345 void * base; //Start of target array. | |
346 int32_t num; //Array size in elements. | |
347 int32_t width; //Element size in bytes. | |
348 | |
349 void * backup; //copy source of base | |
350 public: | |
351 CmdQsort(UErrorCode & status,void *theBase, int32_t num, int32_t width, Func
fn, int32_t,int32_t) | |
352 :backup(theBase),num(num),width(width),fn(fn){ | |
353 base = malloc(num * width); | |
354 time_empty(100, &status); // warm memory/cache | |
355 } | |
356 | |
357 ~CmdQsort(){ | |
358 free(base); | |
359 } | |
360 | |
361 void empty_call(){ | |
362 exec_count = 0; | |
363 memcpy(base, backup, num * width); | |
364 } | |
365 | |
366 double time_empty(int32_t n, UErrorCode* status) { | |
367 UTimer start, stop; | |
368 utimer_getTime(&start); | |
369 while (n-- > 0) { | |
370 empty_call(); | |
371 } | |
372 utimer_getTime(&stop); | |
373 return utimer_getDeltaSeconds(&start,&stop); // ms | |
374 } | |
375 | |
376 virtual void call(UErrorCode* status){ | |
377 exec_count = 0; | |
378 memcpy(base, backup, num * width); | |
379 qsort(base, num, width, fn); | |
380 } | |
381 virtual double time(int32_t n, UErrorCode* status) { | |
382 double t1 = time_empty(n,status); | |
383 double t2 = UPerfFunction::time(n, status); | |
384 return t2-t1;// < 0 ? t2 : t2-t1; | |
385 } | |
386 | |
387 virtual long getOperationsPerIteration(){ return exec_count?exec_count:1
;} | |
388 }; | |
389 int32_t CmdQsort::exec_count; | |
390 | |
391 | |
392 class CmdBinSearch : public UPerfFunction{ | |
393 public: | |
394 typedef int (CmdBinSearch::* Func)(int, int); | |
395 | |
396 UCollator * col; | |
397 DWORD win_langid; | |
398 int32_t count; | |
399 DataIndex * rnd; | |
400 DataIndex * ord; | |
401 Func fn; | |
402 int32_t exec_count; | |
403 | |
404 CmdBinSearch(UErrorCode, UCollator * col,DWORD win_langid,int32_t count,Data
Index * rnd,DataIndex * ord,Func fn) | |
405 :col(col),win_langid(win_langid), count(count), rnd(rnd), ord(ord), fn(f
n),exec_count(0){} | |
406 | |
407 | |
408 virtual void call(UErrorCode* status){ | |
409 exec_count = 0; | |
410 for(int32_t i = 0; i< count; i++){ // search all data | |
411 binary_search(i); | |
412 } | |
413 } | |
414 virtual long getOperationsPerIteration(){ return exec_count?exec_count:1
;} | |
415 | |
416 void binary_search(int32_t random) { | |
417 int low = 0; | |
418 int high = count - 1; | |
419 int guess; | |
420 int last_guess = -1; | |
421 int r; | |
422 while (TRUE) { | |
423 guess = (high + low)/2; | |
424 if (last_guess == guess) break; // nothing to search | |
425 | |
426 r = (this->*fn)(random, guess); | |
427 exec_count++; | |
428 | |
429 if (r == 0) | |
430 return; // found, search end. | |
431 if (r < 0) { | |
432 high = guess; | |
433 } else { | |
434 low = guess; | |
435 } | |
436 last_guess = guess; | |
437 } | |
438 } | |
439 | |
440 int icu_strcoll_null(int32_t i, int32_t j){ | |
441 return ucol_strcoll(col, rnd[i].icu_data, -1, ord[j].icu_data,-1); | |
442 } | |
443 | |
444 int icu_strcoll_len(int32_t i, int32_t j){ | |
445 return ucol_strcoll(col, rnd[i].icu_data, rnd[i].icu_data_len, ord[j
].icu_data, ord[j].icu_data_len); | |
446 } | |
447 | |
448 int icu_cmpkey(int32_t i, int32_t j) { | |
449 return strcmp( (char *) rnd[i].icu_key, (char *) ord[j].icu_key ); | |
450 } | |
451 | |
452 #if U_PLATFORM_HAS_WIN32_API | |
453 int win_cmp_null(int32_t i, int32_t j) { | |
454 int t = CompareStringW(win_langid, 0, rnd[i].win_data, -1, ord[j].wi
n_data, -1); | |
455 if (t == 0){ | |
456 fprintf(stderr, "CompareStringW error, error number %x\n", GetLa
stError()); | |
457 exit(-1); | |
458 } else{ | |
459 return t - CSTR_EQUAL; | |
460 } | |
461 } | |
462 | |
463 int win_cmp_len(int32_t i, int32_t j) { | |
464 int t = CompareStringW(win_langid, 0, rnd[i].win_data, rnd[i].win_da
ta_len, ord[j].win_data, ord[j].win_data_len); | |
465 if (t == 0){ | |
466 fprintf(stderr, "CompareStringW error, error number %x\n", GetLa
stError()); | |
467 exit(-1); | |
468 } else{ | |
469 return t - CSTR_EQUAL; | |
470 } | |
471 } | |
472 #endif | |
473 | |
474 #define BFUNC(name, func, data) \ | |
475 int name(int32_t i, int32_t j) { \ | |
476 return func(rnd[i].data, ord[j].data); \ | |
477 } | |
478 | |
479 BFUNC(posix_strcoll_null, strcoll, posix_data) | |
480 BFUNC(posix_cmpkey, strcmp, posix_key) | |
481 BFUNC(win_cmpkey, strcmp, win_key) | |
482 BFUNC(win_wcscmp, wcscmp, win_data) | |
483 BFUNC(icu_strcmp, u_strcmp, icu_data) | |
484 BFUNC(icu_cmpcpo, u_strcmpCodePointOrder, icu_data) | |
485 }; | |
486 | |
487 class CollPerfTest : public UPerfTest { | |
488 public: | |
489 UCollator * col; | |
490 DWORD win_langid; | |
491 | |
492 UChar * icu_data_all; | |
493 int32_t icu_data_all_len; | |
494 | |
495 int32_t count; | |
496 CA_uchar * icu_data; | |
497 CA_uint8 * icu_key; | |
498 CA_char * posix_data; | |
499 CA_char * posix_key; | |
500 CA_win_wchar * win_data; | |
501 CA_char * win_key; | |
502 | |
503 DataIndex * rnd_index; // random by icu key | |
504 DataIndex * ord_win_data; | |
505 DataIndex * ord_win_key; | |
506 DataIndex * ord_posix_data; | |
507 DataIndex * ord_posix_key; | |
508 DataIndex * ord_icu_data; | |
509 DataIndex * ord_icu_key; | |
510 DataIndex * ord_win_wcscmp; | |
511 DataIndex * ord_icu_strcmp; | |
512 DataIndex * ord_icu_cmpcpo; | |
513 | |
514 virtual ~CollPerfTest(){ | |
515 ucol_close(col); | |
516 delete [] icu_data_all; | |
517 delete icu_data; | |
518 delete icu_key; | |
519 delete posix_data; | |
520 delete posix_key; | |
521 delete win_data; | |
522 delete win_key; | |
523 delete[] rnd_index; | |
524 delete[] ord_win_data; | |
525 delete[] ord_win_key; | |
526 delete[] ord_posix_data; | |
527 delete[] ord_posix_key; | |
528 delete[] ord_icu_data; | |
529 delete[] ord_icu_key; | |
530 delete[] ord_win_wcscmp; | |
531 delete[] ord_icu_strcmp; | |
532 delete[] ord_icu_cmpcpo; | |
533 } | |
534 | |
535 CollPerfTest(int32_t argc, const char* argv[], UErrorCode& status):UPerfTest
(argc, argv, status){ | |
536 col = NULL; | |
537 icu_data_all = NULL; | |
538 icu_data = NULL; | |
539 icu_key = NULL; | |
540 posix_data = NULL; | |
541 posix_key = NULL; | |
542 win_data =NULL; | |
543 win_key = NULL; | |
544 | |
545 rnd_index = NULL; | |
546 ord_win_data= NULL; | |
547 ord_win_key= NULL; | |
548 ord_posix_data= NULL; | |
549 ord_posix_key= NULL; | |
550 ord_icu_data= NULL; | |
551 ord_icu_key= NULL; | |
552 ord_win_wcscmp = NULL; | |
553 ord_icu_strcmp = NULL; | |
554 ord_icu_cmpcpo = NULL; | |
555 | |
556 if (U_FAILURE(status)){ | |
557 return; | |
558 } | |
559 | |
560 // Parse additional arguments | |
561 | |
562 UOption options[] = { | |
563 UOPTION_DEF("langid", 'i', UOPT_REQUIRES_ARG), // Windows Lan
guage ID number. | |
564 UOPTION_DEF("rulefile", 'r', UOPT_REQUIRES_ARG), // --rulef
ile <filename> | |
565 // Collation related arguments. All are optional. | |
566 // To simplify parsing, two choice arguments are disigned as NO_
ARG. | |
567 // The default value is UPPER word in the comment | |
568 UOPTION_DEF("c_french", 'f', UOPT_NO_ARG), // --french
<on | OFF> | |
569 UOPTION_DEF("c_alternate", 'a', UOPT_NO_ARG), // --alterna
te <NON_IGNORE | shifted> | |
570 UOPTION_DEF("c_casefirst", 'c', UOPT_REQUIRES_ARG), // --casefir
st <lower | upper | OFF> | |
571 UOPTION_DEF("c_caselevel", 'l', UOPT_NO_ARG), // --caselev
el <on | OFF> | |
572 UOPTION_DEF("c_normal", 'n', UOPT_NO_ARG), // --normal
<on | OFF> | |
573 UOPTION_DEF("c_strength", 's', UOPT_REQUIRES_ARG), // --strengt
h <1-5> | |
574 }; | |
575 int32_t opt_len = (sizeof(options)/sizeof(options[0])); | |
576 enum {i, r,f,a,c,l,n,s}; // The buffer between the option items' order
and their references | |
577 | |
578 _remainingArgc = u_parseArgs(_remainingArgc, (char**)argv, opt_len, opti
ons); | |
579 | |
580 if (_remainingArgc < 0){ | |
581 status = U_ILLEGAL_ARGUMENT_ERROR; | |
582 return; | |
583 } | |
584 | |
585 if (locale == NULL){ | |
586 locale = "en_US"; // set default locale | |
587 } | |
588 | |
589 #if U_PLATFORM_HAS_WIN32_API | |
590 if (options[i].doesOccur) { | |
591 char *endp; | |
592 int tmp = strtol(options[i].value, &endp, 0); | |
593 if (endp == options[i].value) { | |
594 status = U_ILLEGAL_ARGUMENT_ERROR; | |
595 return; | |
596 } | |
597 win_langid = MAKELCID(tmp, SORT_DEFAULT); | |
598 } else { | |
599 win_langid = uloc_getLCID(locale); | |
600 } | |
601 #endif | |
602 | |
603 // Set up an ICU collator | |
604 if (options[r].doesOccur) { | |
605 // TODO: implement it | |
606 } else { | |
607 col = ucol_open(locale, &status); | |
608 if (U_FAILURE(status)) { | |
609 return; | |
610 } | |
611 } | |
612 | |
613 if (options[f].doesOccur) { | |
614 ucol_setAttribute(col, UCOL_FRENCH_COLLATION, UCOL_ON, &status); | |
615 } else { | |
616 ucol_setAttribute(col, UCOL_FRENCH_COLLATION, UCOL_OFF, &status); | |
617 } | |
618 | |
619 if (options[a].doesOccur) { | |
620 ucol_setAttribute(col, UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, &statu
s); | |
621 } | |
622 | |
623 if (options[c].doesOccur) { // strcmp() has i18n encoding problem | |
624 if (strcmp("lower", options[c].value) == 0){ | |
625 ucol_setAttribute(col, UCOL_CASE_FIRST, UCOL_LOWER_FIRST, &statu
s); | |
626 } else if (strcmp("upper", options[c].value) == 0) { | |
627 ucol_setAttribute(col, UCOL_CASE_FIRST, UCOL_UPPER_FIRST, &statu
s); | |
628 } else { | |
629 status = U_ILLEGAL_ARGUMENT_ERROR; | |
630 return; | |
631 } | |
632 } | |
633 | |
634 if (options[l].doesOccur){ | |
635 ucol_setAttribute(col, UCOL_CASE_LEVEL, UCOL_ON, &status); | |
636 } | |
637 | |
638 if (options[n].doesOccur){ | |
639 ucol_setAttribute(col, UCOL_NORMALIZATION_MODE, UCOL_ON, &status); | |
640 } | |
641 | |
642 if (options[s].doesOccur) { | |
643 char *endp; | |
644 int tmp = strtol(options[l].value, &endp, 0); | |
645 if (endp == options[l].value) { | |
646 status = U_ILLEGAL_ARGUMENT_ERROR; | |
647 return; | |
648 } | |
649 switch (tmp) { | |
650 case 1: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_PRIMARY, &sta
tus); break; | |
651 case 2: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_SECONDARY, &s
tatus); break; | |
652 case 3: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_TERTIARY, &st
atus); break; | |
653 case 4: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_QUATERNARY, &
status); break; | |
654 case 5: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_IDENTICAL, &s
tatus); break; | |
655 default: status = U_ILLEGAL_ARGUMENT_ERROR;
return; | |
656 } | |
657 } | |
658 prepareData(status); | |
659 } | |
660 | |
// Registers one test without the explicit 'id' argument that TESTCASE(id, test)
// style macros require. It relies on the local variables `temp` (running test
// number), `index`, `exec` and `name` of the enclosing runIndexedTest().
// When `temp` matches `index`, it stores the test name and returns either NULL
// (exec is false, or constructing the test object reported a failure) or the
// newly created test object; otherwise it just advances `temp`.
#define TEST(testname, classname, arg1, arg2, arg3, arg4, arg5, arg6) \
    if (temp == index) { \
        name = #testname; \
        if (!exec) { \
            return NULL; \
        } \
        UErrorCode status = U_ZERO_ERROR; \
        UPerfFunction * t = new classname(status, arg1, arg2, arg3, arg4, arg5, arg6); \
        if (U_FAILURE(status)) { \
            delete t; \
            return NULL; \
        } \
        return t; \
    } \
    temp++
680 | |
681 virtual UPerfFunction* runIndexedTest( /*[in]*/int32_t index, /*[in]*/UBool
exec, /*[out]*/const char* &name, /*[in]*/ char* par = NULL ){ | |
682 int temp = 0; | |
683 | |
684 #define TEST_KEYGEN(testname, func)\ | |
685 TEST(testname, CmdKeyGen, col, win_langid, count, rnd_index, &CmdKeyGen::fun
c, 0) | |
686 TEST_KEYGEN(TestIcu_KeyGen_null, icu_key_null); | |
687 TEST_KEYGEN(TestIcu_KeyGen_len, icu_key_len); | |
688 TEST_KEYGEN(TestPosix_KeyGen_null, posix_key_null); | |
689 #if U_PLATFORM_HAS_WIN32_API | |
690 TEST_KEYGEN(TestWin_KeyGen_null, win_key_null); | |
691 TEST_KEYGEN(TestWin_KeyGen_len, win_key_len); | |
692 #endif | |
693 | |
694 #define TEST_ITER(testname, func)\ | |
695 TEST(testname, CmdIter, col, count, icu_data, &CmdIter::func,0,0) | |
696 TEST_ITER(TestIcu_ForwardIter_null, icu_forward_null); | |
697 TEST_ITER(TestIcu_ForwardIter_len, icu_forward_len); | |
698 TEST_ITER(TestIcu_BackwardIter_null, icu_backward_null); | |
699 TEST_ITER(TestIcu_BackwardIter_len, icu_backward_len); | |
700 | |
701 #define TEST_ITER_ALL(testname, func)\ | |
702 TEST(testname, CmdIterAll, col, icu_data_all_len, icu_data_all, CmdIterAll::
func,0,0) | |
703 TEST_ITER_ALL(TestIcu_ForwardIter_all_null, forward_null); | |
704 TEST_ITER_ALL(TestIcu_ForwardIter_all_len, forward_len); | |
705 TEST_ITER_ALL(TestIcu_BackwardIter_all_null, backward_null); | |
706 TEST_ITER_ALL(TestIcu_BackwardIter_all_len, backward_len); | |
707 | |
708 #define TEST_QSORT(testname, func)\ | |
709 TEST(testname, CmdQsort, rnd_index, count, sizeof(DataIndex), CmdQsort::func
,0,0) | |
710 TEST_QSORT(TestIcu_qsort_strcoll_null, icu_strcoll_null); | |
711 TEST_QSORT(TestIcu_qsort_strcoll_len, icu_strcoll_len); | |
712 TEST_QSORT(TestIcu_qsort_usekey, icu_cmpkey); | |
713 TEST_QSORT(TestPosix_qsort_strcoll_null, posix_strcoll_null); | |
714 TEST_QSORT(TestPosix_qsort_usekey, posix_cmpkey); | |
715 #if U_PLATFORM_HAS_WIN32_API | |
716 TEST_QSORT(TestWin_qsort_CompareStringW_null, win_cmp_null); | |
717 TEST_QSORT(TestWin_qsort_CompareStringW_len, win_cmp_len); | |
718 TEST_QSORT(TestWin_qsort_usekey, win_cmpkey); | |
719 #endif | |
720 | |
721 #define TEST_BIN(testname, func)\ | |
722 TEST(testname, CmdBinSearch, col, win_langid, count, rnd_index, ord_icu_key,
&CmdBinSearch::func) | |
723 TEST_BIN(TestIcu_BinarySearch_strcoll_null, icu_strcoll_null); | |
724 TEST_BIN(TestIcu_BinarySearch_strcoll_len, icu_strcoll_len); | |
725 TEST_BIN(TestIcu_BinarySearch_usekey, icu_cmpkey); | |
726 TEST_BIN(TestIcu_BinarySearch_strcmp, icu_strcmp); | |
727 TEST_BIN(TestIcu_BinarySearch_cmpCPO, icu_cmpcpo); | |
728 TEST_BIN(TestPosix_BinarySearch_strcoll_null, posix_strcoll_null); | |
729 TEST_BIN(TestPosix_BinarySearch_usekey, posix_cmpkey); | |
730 #if U_PLATFORM_HAS_WIN32_API | |
731 TEST_BIN(TestWin_BinarySearch_CompareStringW_null, win_cmp_null); | |
732 TEST_BIN(TestWin_BinarySearch_CompareStringW_len, win_cmp_len); | |
733 #endif | |
734 TEST_BIN(TestWin_BinarySearch_usekey, win_cmpkey); | |
735 TEST_BIN(TestWin_BinarySearch_wcscmp, win_wcscmp); | |
736 | |
737 name=""; | |
738 return NULL; | |
739 } | |
740 | |
741 | |
742 | |
743 void prepareData(UErrorCode& status){ | |
744 if(U_FAILURE(status)) return; | |
745 if (icu_data) return; // prepared | |
746 | |
747 icu_data = new CA_uchar(); | |
748 | |
749 // Following code is borrowed from UPerfTest::getLines(); | |
750 const UChar* line=NULL; | |
751 int32_t len =0; | |
752 for (;;) { | |
753 line = ucbuf_readline(ucharBuf,&len,&status); | |
754 if(line == NULL || U_FAILURE(status)){break;} | |
755 | |
756 // Refer to the source code of ucbuf_readline() | |
757 // 1. 'len' includs the line terminal symbols | |
758 // 2. The length of the line terminal symbols is only one character | |
759 // 3. The Windows CR LF line terminal symbols will be converted to C
R | |
760 | |
761 if (len == 1) { | |
762 continue; //skip empty line | |
763 } else { | |
764 icu_data->append_one(len); | |
765 memcpy(icu_data->last(), line, len * sizeof(UChar)); | |
766 icu_data->last()[len -1] = NULL; | |
767 } | |
768 } | |
769 if(U_FAILURE(status)) return; | |
770 | |
771 // UTF-16 -> UTF-8 conversion. | |
772 UConverter *conv = ucnv_open("utf-8", &status); // just UTF-8 for now. | |
773 if (U_FAILURE(status)) return; | |
774 | |
775 count = icu_data->count; | |
776 | |
777 icu_data_all_len = icu_data->index[count]; // includes all NULLs | |
778 icu_data_all_len -= count; // excludes all NULLs | |
779 icu_data_all_len += 1; // the terminal NULL | |
780 icu_data_all = new UChar[icu_data_all_len]; | |
781 icu_data_all[icu_data_all_len - 1] = 0; //the terminal NULL | |
782 | |
783 icu_key = new CA_uint8; | |
784 win_data = new CA_win_wchar; | |
785 win_key = new CA_char; | |
786 posix_data = new CA_char; | |
787 posix_key = new CA_char; | |
788 rnd_index = new DataIndex[count]; | |
789 DataIndex::win_langid = win_langid; | |
790 DataIndex::col = col; | |
791 | |
792 | |
793 UChar * p = icu_data_all; | |
794 int32_t s; | |
795 int32_t t; | |
796 for (int i=0; i < count; i++) { | |
797 // ICU all data | |
798 s = sizeof(UChar) * icu_data->lengthOf(i); | |
799 memcpy(p, icu_data->dataOf(i), s); | |
800 p += icu_data->lengthOf(i); | |
801 | |
802 // ICU data | |
803 | |
804 // ICU key | |
805 s = ucol_getSortKey(col, icu_data->dataOf(i), -1,NULL, 0); | |
806 icu_key->append_one(s); | |
807 t = ucol_getSortKey(col, icu_data->dataOf(i), -1,icu_key->last(), s)
; | |
808 if (t != s) {status = U_INVALID_FORMAT_ERROR;return;} | |
809 | |
810 // POSIX data | |
811 s = ucnv_fromUChars(conv,NULL, 0, icu_data->dataOf(i), icu_data->len
gthOf(i), &status); | |
812 if (status == U_BUFFER_OVERFLOW_ERROR || status == U_ZERO_ERROR){ | |
813 status = U_ZERO_ERROR; | |
814 } else { | |
815 return; | |
816 } | |
817 posix_data->append_one(s + 1); // plus terminal NULL | |
818 t = ucnv_fromUChars(conv,posix_data->last(), s, icu_data->dataOf(i),
icu_data->lengthOf(i), &status); | |
819 if (U_FAILURE(status)) return; | |
820 if ( t != s){status = U_INVALID_FORMAT_ERROR;return;} | |
821 posix_data->last()[s] = 0; | |
822 | |
823 // POSIX key | |
824 s = strxfrm(NULL, posix_data->dataOf(i), 0); | |
825 if (s == INT_MAX){status = U_INVALID_FORMAT_ERROR;return;} | |
826 posix_key->append_one(s); | |
827 t = strxfrm(posix_key->last(), posix_data->dataOf(i), s); | |
828 if (t != s) {status = U_INVALID_FORMAT_ERROR;return;} | |
829 | |
830 #if U_PLATFORM_HAS_WIN32_API | |
831 // Win data | |
832 s = icu_data->lengthOf(i) + 1; // plus terminal NULL | |
833 win_data->append_one(s); | |
834 memcpy(win_data->last(), icu_data->dataOf(i), sizeof(WCHAR) * s); | |
835 | |
836 // Win key | |
837 s = LCMapStringW(win_langid, LCMAP_SORTKEY, win_data->dataOf(i), win
_data->lengthOf(i), NULL,0); | |
838 if (s == 0) {status = U_INVALID_FORMAT_ERROR;return;} | |
839 win_key->append_one(s); | |
840 t = LCMapStringW(win_langid, LCMAP_SORTKEY, win_data->dataOf(i), win
_data->lengthOf(i), (WCHAR *)(win_key->last()),s); | |
841 if (t != s) {status = U_INVALID_FORMAT_ERROR;return;} | |
842 #endif | |
843 }; | |
844 | |
845 // append_one() will make points shifting, should not merge following co
de into previous iteration | |
846 for (int i=0; i < count; i++) { | |
847 rnd_index[i].icu_key = icu_key->dataOf(i); | |
848 rnd_index[i].icu_data = icu_data->dataOf(i); | |
849 rnd_index[i].icu_data_len = icu_data->lengthOf(i); | |
850 rnd_index[i].posix_key = posix_key->last(); | |
851 rnd_index[i].posix_data = posix_data->dataOf(i); | |
852 rnd_index[i].posix_data_len = posix_data->lengthOf(i); | |
853 #if U_PLATFORM_HAS_WIN32_API | |
854 rnd_index[i].win_key = win_key->dataOf(i); | |
855 rnd_index[i].win_data = win_data->dataOf(i); | |
856 rnd_index[i].win_data_len = win_data->lengthOf(i); | |
857 #endif | |
858 }; | |
859 | |
860 ucnv_close(conv); | |
861 qsort(rnd_index, count, sizeof(DataIndex), CmdQsort::q_random); | |
862 | |
863 #define SORT(data, func) \ | |
864 data = new DataIndex[count];\ | |
865 memcpy(data, rnd_index, count * sizeof(DataIndex));\ | |
866 qsort(data, count, sizeof(DataIndex), CmdQsort::func) | |
867 | |
868 SORT(ord_icu_data, icu_strcoll_len); | |
869 SORT(ord_icu_key, icu_cmpkey); | |
870 SORT(ord_posix_data, posix_strcoll_null); | |
871 SORT(ord_posix_key, posix_cmpkey); | |
872 #if U_PLATFORM_HAS_WIN32_API | |
873 SORT(ord_win_data, win_cmp_len); | |
874 SORT(ord_win_key, win_cmpkey); | |
875 SORT(ord_win_wcscmp, win_wcscmp); | |
876 #endif | |
877 SORT(ord_icu_strcmp, icu_strcmp); | |
878 SORT(ord_icu_cmpcpo, icu_cmpcpo); | |
879 } | |
880 }; | |
881 | |
882 | |
883 int main(int argc, const char *argv[]) | |
884 { | |
885 | |
886 UErrorCode status = U_ZERO_ERROR; | |
887 CollPerfTest test(argc, argv, status); | |
888 | |
889 if (U_FAILURE(status)){ | |
890 printf("The error is %s\n", u_errorName(status)); | |
891 //TODO: print usage here | |
892 return status; | |
893 } | |
894 | |
895 if (test.run() == FALSE){ | |
896 fprintf(stderr, "FAILED: Tests could not be run please check the " | |
897 "arguments.\n"); | |
898 return -1; | |
899 } | |
900 return 0; | |
901 } | |
902 | |
OLD | NEW |