| OLD | NEW |
| (Empty) |
| 1 /******************************************************************** | |
| 2 * COPYRIGHT: | |
| 3 * Copyright (C) 2001-2012 IBM, Inc. All Rights Reserved. | |
| 4 * | |
| 5 ********************************************************************/ | |
| 6 | |
| 7 #include <stdio.h> | |
| 8 #include <stdlib.h> | |
| 9 #include <locale.h> | |
| 10 #include <limits.h> | |
| 11 #include <string.h> | |
| 12 #include "unicode/uperf.h" | |
| 13 #include "uoptions.h" | |
| 14 #include "unicode/coll.h" | |
| 15 #include <unicode/ucoleitr.h> | |
| 16 | |
| 17 #if !U_PLATFORM_HAS_WIN32_API | |
| 18 #define DWORD uint32_t | |
| 19 #define WCHAR wchar_t | |
| 20 #endif | |
| 21 | |
/* Stores an array of string<UNIT> in one contiguous buffer.
   Since string<UNIT> itself is treated as an array of UNIT, this
   class eases memory management for an array of string<UNIT>.

   COMPATCT_ARRAY(CompactArrays, UNIT) defines a struct named CompactArrays:
     - data holds all strings back to back, each one followed by its terminator;
     - index[i] is the offset (in UNITs) of string i inside data, and
       index[count] is the total number of UNITs reserved so far.
   append_one() may move both buffers (realloc), so pointers previously
   obtained from last()/dataOf() must not be kept across an append_one() call.
   If an allocation fails the program is terminated with abort().
   The copy constructor and copy assignment operator are only declared here;
   this macro provides no definition for them.
*/

//template<typename UNIT>
#define COMPATCT_ARRAY(CompactArrays, UNIT) \
struct CompactArrays{\
    CompactArrays(const CompactArrays & );\
    CompactArrays & operator=(const CompactArrays & );\
    int32_t count;   /*total number of the strings*/ \
    int32_t * index; /*relative offset in data; holds count + 1 entries*/ \
    UNIT * data;     /*the real space to hold strings*/ \
    \
    ~CompactArrays(){free(index);free(data);} \
    /*initializers are listed in declaration order: count, index, data*/ \
    CompactArrays():count(0), index(NULL), data(NULL){ \
        index = (int32_t *) malloc(sizeof(int32_t)); \
        if (index == NULL) {abort();} \
        index[0] = 0; \
    } \
    /*reserve room for one more string of theLen UNITs (theLen includes the terminal NULL)*/ \
    void append_one(int32_t theLen){ \
        int32_t * grownIndex = (int32_t *) realloc(index, sizeof(int32_t) * (count + 2)); \
        if (grownIndex == NULL) {abort();} \
        index = grownIndex; \
        int32_t total = index[count] + theLen; \
        UNIT * grownData = (UNIT *) realloc(data, sizeof(UNIT) * total); \
        if (grownData == NULL && total > 0) {abort();} \
        data = grownData; \
        count++; \
        index[count] = total; \
    } \
    UNIT * last(){return data + index[count - 1];} /*start of the most recently appended string*/ \
    UNIT * dataOf(int32_t i){return data + index[i];} /*start of string i*/ \
    int32_t lengthOf(int32_t i){return index[i+1] - index[i] - 1; } /*exclude terminating NULL*/ \
};
| 51 | |
| 52 //typedef CompactArrays<UChar> CA_uchar; | |
| 53 //typedef CompactArrays<char> CA_char; | |
| 54 //typedef CompactArrays<uint8_t> CA_uint8; | |
| 55 //typedef CompactArrays<WCHAR> CA_win_wchar; | |
| 56 | |
| 57 COMPATCT_ARRAY(CA_uchar, UChar) | |
| 58 COMPATCT_ARRAY(CA_char, char) | |
| 59 COMPATCT_ARRAY(CA_uint8, uint8_t) | |
| 60 COMPATCT_ARRAY(CA_win_wchar, WCHAR) | |
| 61 | |
| 62 | |
| 63 struct DataIndex { | |
| 64 static DWORD win_langid; // for qsort callback function | |
| 65 static UCollator * col; // for qsort callback function | |
| 66 uint8_t * icu_key; | |
| 67 UChar * icu_data; | |
| 68 int32_t icu_data_len; | |
| 69 char* posix_key; | |
| 70 char* posix_data; | |
| 71 int32_t posix_data_len; | |
| 72 char* win_key; | |
| 73 WCHAR * win_data; | |
| 74 int32_t win_data_len; | |
| 75 }; | |
| 76 DWORD DataIndex::win_langid; | |
| 77 UCollator * DataIndex::col; | |
| 78 | |
| 79 | |
| 80 | |
| 81 class CmdKeyGen : public UPerfFunction { | |
| 82 typedef void (CmdKeyGen::* Func)(int32_t); | |
| 83 enum{MAX_KEY_LENGTH = 5000}; | |
| 84 UCollator * col; | |
| 85 DWORD win_langid; | |
| 86 int32_t count; | |
| 87 DataIndex * data; | |
| 88 Func fn; | |
| 89 | |
| 90 union { // to save sapce | |
| 91 uint8_t icu_key[MAX_KEY_LENGTH]; | |
| 92 char posix_key[MAX_KEY_LENGTH]; | |
| 93 WCHAR win_key[MAX_KEY_LENGTH]; | |
| 94 }; | |
| 95 public: | |
| 96 CmdKeyGen(UErrorCode, UCollator * col,DWORD win_langid, int32_t count, DataI
ndex * data,Func fn,int32_t) | |
| 97 :col(col),win_langid(win_langid), count(count), data(data), fn(fn){} | |
| 98 | |
| 99 virtual long getOperationsPerIteration(){return count;} | |
| 100 | |
| 101 virtual void call(UErrorCode* status){ | |
| 102 for(int32_t i = 0; i< count; i++){ | |
| 103 (this->*fn)(i); | |
| 104 } | |
| 105 } | |
| 106 | |
| 107 void icu_key_null(int32_t i){ | |
| 108 ucol_getSortKey(col, data[i].icu_data, -1, icu_key, MAX_KEY_LENGTH); | |
| 109 } | |
| 110 | |
| 111 void icu_key_len(int32_t i){ | |
| 112 ucol_getSortKey(col, data[i].icu_data, data[i].icu_data_len, icu_key
, MAX_KEY_LENGTH); | |
| 113 } | |
| 114 | |
| 115 #if U_PLATFORM_HAS_WIN32_API | |
| 116 // pre-generated in CollPerfTest::prepareData(), need not to check error
here | |
| 117 void win_key_null(int32_t i){ | |
| 118 //LCMAP_SORTsk 0x00000400 // WC sort sk (normalize) | |
| 119 LCMapStringW(win_langid, LCMAP_SORTKEY, data[i].win_data, -1, win_ke
y, MAX_KEY_LENGTH); | |
| 120 } | |
| 121 | |
| 122 void win_key_len(int32_t i){ | |
| 123 LCMapStringW(win_langid, LCMAP_SORTKEY, data[i].win_data, data[i].wi
n_data_len, win_key, MAX_KEY_LENGTH); | |
| 124 } | |
| 125 #endif | |
| 126 | |
| 127 void posix_key_null(int32_t i){ | |
| 128 strxfrm(posix_key, data[i].posix_data, MAX_KEY_LENGTH); | |
| 129 } | |
| 130 }; | |
| 131 | |
| 132 | |
| 133 class CmdIter : public UPerfFunction { | |
| 134 typedef void (CmdIter::* Func)(UErrorCode* , int32_t ); | |
| 135 int32_t count; | |
| 136 CA_uchar * data; | |
| 137 Func fn; | |
| 138 UCollationElements *iter; | |
| 139 int32_t exec_count; | |
| 140 public: | |
| 141 CmdIter(UErrorCode & status, UCollator * col, int32_t count, CA_uchar *data,
Func fn, int32_t,int32_t) | |
| 142 :count(count), data(data), fn(fn){ | |
| 143 exec_count = 0; | |
| 144 UChar dummytext[] = {0, 0}; | |
| 145 iter = ucol_openElements(col, NULL, 0, &status); | |
| 146 ucol_setText(iter, dummytext, 1, &status); | |
| 147 } | |
| 148 ~CmdIter(){ | |
| 149 ucol_closeElements(iter); | |
| 150 } | |
| 151 | |
| 152 virtual long getOperationsPerIteration(){return exec_count ? exec_count
: 1;} | |
| 153 | |
| 154 virtual void call(UErrorCode* status){ | |
| 155 exec_count = 0; | |
| 156 for(int32_t i = 0; i< count; i++){ | |
| 157 (this->*fn)(status, i); | |
| 158 } | |
| 159 } | |
| 160 | |
| 161 void icu_forward_null(UErrorCode* status, int32_t i){ | |
| 162 ucol_setText(iter, data->dataOf(i), -1, status); | |
| 163 while (ucol_next(iter, status) != UCOL_NULLORDER) exec_count++; | |
| 164 } | |
| 165 | |
| 166 void icu_forward_len(UErrorCode* status, int32_t i){ | |
| 167 ucol_setText(iter, data->dataOf(i), data->lengthOf(i) , status); | |
| 168 while (ucol_next(iter, status) != UCOL_NULLORDER) exec_count++; | |
| 169 } | |
| 170 | |
| 171 void icu_backward_null(UErrorCode* status, int32_t i){ | |
| 172 ucol_setText(iter, data->dataOf(i), -1, status); | |
| 173 while (ucol_previous(iter, status) != UCOL_NULLORDER) exec_count++; | |
| 174 } | |
| 175 | |
| 176 void icu_backward_len(UErrorCode* status, int32_t i){ | |
| 177 ucol_setText(iter, data->dataOf(i), data->lengthOf(i) , status); | |
| 178 while (ucol_previous(iter, status) != UCOL_NULLORDER) exec_count++; | |
| 179 } | |
| 180 }; | |
| 181 | |
| 182 class CmdIterAll : public UPerfFunction { | |
| 183 typedef void (CmdIterAll::* Func)(UErrorCode* status); | |
| 184 int32_t count; | |
| 185 UChar * data; | |
| 186 Func fn; | |
| 187 UCollationElements *iter; | |
| 188 int32_t exec_count; | |
| 189 | |
| 190 public: | |
| 191 enum CALL {forward_null, forward_len, backward_null, backward_len}; | |
| 192 | |
| 193 ~CmdIterAll(){ | |
| 194 ucol_closeElements(iter); | |
| 195 } | |
| 196 CmdIterAll(UErrorCode & status, UCollator * col, int32_t count, UChar * dat
a, CALL call,int32_t,int32_t) | |
| 197 :count(count),data(data) | |
| 198 { | |
| 199 exec_count = 0; | |
| 200 if (call == forward_null || call == backward_null) { | |
| 201 iter = ucol_openElements(col, data, -1, &status); | |
| 202 } else { | |
| 203 iter = ucol_openElements(col, data, count, &status); | |
| 204 } | |
| 205 | |
| 206 if (call == forward_null || call == forward_len){ | |
| 207 fn = &CmdIterAll::icu_forward_all; | |
| 208 } else { | |
| 209 fn = &CmdIterAll::icu_backward_all; | |
| 210 } | |
| 211 } | |
| 212 virtual long getOperationsPerIteration(){return exec_count ? exec_count : 1;
} | |
| 213 | |
| 214 virtual void call(UErrorCode* status){ | |
| 215 (this->*fn)(status); | |
| 216 } | |
| 217 | |
| 218 void icu_forward_all(UErrorCode* status){ | |
| 219 int strlen = count - 5; | |
| 220 int count5 = 5; | |
| 221 int strindex = 0; | |
| 222 ucol_setOffset(iter, strindex, status); | |
| 223 while (TRUE) { | |
| 224 if (ucol_next(iter, status) == UCOL_NULLORDER) { | |
| 225 break; | |
| 226 } | |
| 227 exec_count++; | |
| 228 count5 --; | |
| 229 if (count5 == 0) { | |
| 230 strindex += 10; | |
| 231 if (strindex > strlen) { | |
| 232 break; | |
| 233 } | |
| 234 ucol_setOffset(iter, strindex, status); | |
| 235 count5 = 5; | |
| 236 } | |
| 237 } | |
| 238 } | |
| 239 | |
| 240 void icu_backward_all(UErrorCode* status){ | |
| 241 int strlen = count; | |
| 242 int count5 = 5; | |
| 243 int strindex = 5; | |
| 244 ucol_setOffset(iter, strindex, status); | |
| 245 while (TRUE) { | |
| 246 if (ucol_previous(iter, status) == UCOL_NULLORDER) { | |
| 247 break; | |
| 248 } | |
| 249 exec_count++; | |
| 250 count5 --; | |
| 251 if (count5 == 0) { | |
| 252 strindex += 10; | |
| 253 if (strindex > strlen) { | |
| 254 break; | |
| 255 } | |
| 256 ucol_setOffset(iter, strindex, status); | |
| 257 count5 = 5; | |
| 258 } | |
| 259 } | |
| 260 } | |
| 261 | |
| 262 }; | |
| 263 | |
| 264 struct CmdQsort : public UPerfFunction{ | |
| 265 | |
| 266 static int q_random(const void * a, const void * b){ | |
| 267 uint8_t * key_a = ((DataIndex *)a)->icu_key; | |
| 268 uint8_t * key_b = ((DataIndex *)b)->icu_key; | |
| 269 | |
| 270 int val_a = 0; | |
| 271 int val_b = 0; | |
| 272 while (*key_a != 0) {val_a += val_a*37 + *key_a++;} | |
| 273 while (*key_b != 0) {val_b += val_b*37 + *key_b++;} | |
| 274 return val_a - val_b; | |
| 275 } | |
| 276 | |
| 277 #define QCAST() \ | |
| 278 DataIndex * da = (DataIndex *) a; \ | |
| 279 DataIndex * db = (DataIndex *) b; \ | |
| 280 ++exec_count | |
| 281 | |
| 282 static int icu_strcoll_null(const void *a, const void *b){ | |
| 283 QCAST(); | |
| 284 return ucol_strcoll(da->col, da->icu_data, -1, db->icu_data, -1) - UCOL_
EQUAL; | |
| 285 } | |
| 286 | |
| 287 static int icu_strcoll_len(const void *a, const void *b){ | |
| 288 QCAST(); | |
| 289 return ucol_strcoll(da->col, da->icu_data, da->icu_data_len, db->icu_dat
a, db->icu_data_len) - UCOL_EQUAL; | |
| 290 } | |
| 291 | |
| 292 static int icu_cmpkey (const void *a, const void *b){ | |
| 293 QCAST(); | |
| 294 return strcmp((char *) da->icu_key, (char *) db->icu_key); | |
| 295 } | |
| 296 | |
| 297 #if U_PLATFORM_HAS_WIN32_API | |
| 298 static int win_cmp_null(const void *a, const void *b) { | |
| 299 QCAST(); | |
| 300 //CSTR_LESS_THAN 1 | |
| 301 //CSTR_EQUAL 2 | |
| 302 //CSTR_GREATER_THAN 3 | |
| 303 int t = CompareStringW(da->win_langid, 0, da->win_data, -1, db->win_data
, -1); | |
| 304 if (t == 0){ | |
| 305 fprintf(stderr, "CompareStringW error, error number %x\n", GetLastEr
ror()); | |
| 306 exit(-1); | |
| 307 } else{ | |
| 308 return t - CSTR_EQUAL; | |
| 309 } | |
| 310 } | |
| 311 | |
| 312 static int win_cmp_len(const void *a, const void *b) { | |
| 313 QCAST(); | |
| 314 int t = CompareStringW(da->win_langid, 0, da->win_data, da->win_data_len
, db->win_data, db->win_data_len); | |
| 315 if (t == 0){ | |
| 316 fprintf(stderr, "CompareStringW error, error number %x\n", GetLastEr
ror()); | |
| 317 exit(-1); | |
| 318 } else{ | |
| 319 return t - CSTR_EQUAL; | |
| 320 } | |
| 321 } | |
| 322 #endif | |
| 323 | |
| 324 #define QFUNC(name, func, data) \ | |
| 325 static int name (const void *a, const void *b){ \ | |
| 326 QCAST(); \ | |
| 327 return func(da->data, db->data); \ | |
| 328 } | |
| 329 | |
| 330 QFUNC(posix_strcoll_null, strcoll, posix_data) | |
| 331 QFUNC(posix_cmpkey, strcmp, posix_key) | |
| 332 #if U_PLATFORM_HAS_WIN32_API | |
| 333 QFUNC(win_cmpkey, strcmp, win_key) | |
| 334 QFUNC(win_wcscmp, wcscmp, win_data) | |
| 335 #endif | |
| 336 QFUNC(icu_strcmp, u_strcmp, icu_data) | |
| 337 QFUNC(icu_cmpcpo, u_strcmpCodePointOrder, icu_data) | |
| 338 | |
| 339 private: | |
| 340 static int32_t exec_count; // potential muilt-thread problem | |
| 341 | |
| 342 typedef int (* Func)(const void *, const void *); | |
| 343 | |
| 344 Func fn; | |
| 345 void * base; //Start of target array. | |
| 346 int32_t num; //Array size in elements. | |
| 347 int32_t width; //Element size in bytes. | |
| 348 | |
| 349 void * backup; //copy source of base | |
| 350 public: | |
| 351 CmdQsort(UErrorCode & status,void *theBase, int32_t num, int32_t width, Func
fn, int32_t,int32_t) | |
| 352 :backup(theBase),num(num),width(width),fn(fn){ | |
| 353 base = malloc(num * width); | |
| 354 time_empty(100, &status); // warm memory/cache | |
| 355 } | |
| 356 | |
| 357 ~CmdQsort(){ | |
| 358 free(base); | |
| 359 } | |
| 360 | |
| 361 void empty_call(){ | |
| 362 exec_count = 0; | |
| 363 memcpy(base, backup, num * width); | |
| 364 } | |
| 365 | |
| 366 double time_empty(int32_t n, UErrorCode* status) { | |
| 367 UTimer start, stop; | |
| 368 utimer_getTime(&start); | |
| 369 while (n-- > 0) { | |
| 370 empty_call(); | |
| 371 } | |
| 372 utimer_getTime(&stop); | |
| 373 return utimer_getDeltaSeconds(&start,&stop); // ms | |
| 374 } | |
| 375 | |
| 376 virtual void call(UErrorCode* status){ | |
| 377 exec_count = 0; | |
| 378 memcpy(base, backup, num * width); | |
| 379 qsort(base, num, width, fn); | |
| 380 } | |
| 381 virtual double time(int32_t n, UErrorCode* status) { | |
| 382 double t1 = time_empty(n,status); | |
| 383 double t2 = UPerfFunction::time(n, status); | |
| 384 return t2-t1;// < 0 ? t2 : t2-t1; | |
| 385 } | |
| 386 | |
| 387 virtual long getOperationsPerIteration(){ return exec_count?exec_count:1
;} | |
| 388 }; | |
| 389 int32_t CmdQsort::exec_count; | |
| 390 | |
| 391 | |
| 392 class CmdBinSearch : public UPerfFunction{ | |
| 393 public: | |
| 394 typedef int (CmdBinSearch::* Func)(int, int); | |
| 395 | |
| 396 UCollator * col; | |
| 397 DWORD win_langid; | |
| 398 int32_t count; | |
| 399 DataIndex * rnd; | |
| 400 DataIndex * ord; | |
| 401 Func fn; | |
| 402 int32_t exec_count; | |
| 403 | |
| 404 CmdBinSearch(UErrorCode, UCollator * col,DWORD win_langid,int32_t count,Data
Index * rnd,DataIndex * ord,Func fn) | |
| 405 :col(col),win_langid(win_langid), count(count), rnd(rnd), ord(ord), fn(f
n),exec_count(0){} | |
| 406 | |
| 407 | |
| 408 virtual void call(UErrorCode* status){ | |
| 409 exec_count = 0; | |
| 410 for(int32_t i = 0; i< count; i++){ // search all data | |
| 411 binary_search(i); | |
| 412 } | |
| 413 } | |
| 414 virtual long getOperationsPerIteration(){ return exec_count?exec_count:1
;} | |
| 415 | |
| 416 void binary_search(int32_t random) { | |
| 417 int low = 0; | |
| 418 int high = count - 1; | |
| 419 int guess; | |
| 420 int last_guess = -1; | |
| 421 int r; | |
| 422 while (TRUE) { | |
| 423 guess = (high + low)/2; | |
| 424 if (last_guess == guess) break; // nothing to search | |
| 425 | |
| 426 r = (this->*fn)(random, guess); | |
| 427 exec_count++; | |
| 428 | |
| 429 if (r == 0) | |
| 430 return; // found, search end. | |
| 431 if (r < 0) { | |
| 432 high = guess; | |
| 433 } else { | |
| 434 low = guess; | |
| 435 } | |
| 436 last_guess = guess; | |
| 437 } | |
| 438 } | |
| 439 | |
| 440 int icu_strcoll_null(int32_t i, int32_t j){ | |
| 441 return ucol_strcoll(col, rnd[i].icu_data, -1, ord[j].icu_data,-1); | |
| 442 } | |
| 443 | |
| 444 int icu_strcoll_len(int32_t i, int32_t j){ | |
| 445 return ucol_strcoll(col, rnd[i].icu_data, rnd[i].icu_data_len, ord[j
].icu_data, ord[j].icu_data_len); | |
| 446 } | |
| 447 | |
| 448 int icu_cmpkey(int32_t i, int32_t j) { | |
| 449 return strcmp( (char *) rnd[i].icu_key, (char *) ord[j].icu_key ); | |
| 450 } | |
| 451 | |
| 452 #if U_PLATFORM_HAS_WIN32_API | |
| 453 int win_cmp_null(int32_t i, int32_t j) { | |
| 454 int t = CompareStringW(win_langid, 0, rnd[i].win_data, -1, ord[j].wi
n_data, -1); | |
| 455 if (t == 0){ | |
| 456 fprintf(stderr, "CompareStringW error, error number %x\n", GetLa
stError()); | |
| 457 exit(-1); | |
| 458 } else{ | |
| 459 return t - CSTR_EQUAL; | |
| 460 } | |
| 461 } | |
| 462 | |
| 463 int win_cmp_len(int32_t i, int32_t j) { | |
| 464 int t = CompareStringW(win_langid, 0, rnd[i].win_data, rnd[i].win_da
ta_len, ord[j].win_data, ord[j].win_data_len); | |
| 465 if (t == 0){ | |
| 466 fprintf(stderr, "CompareStringW error, error number %x\n", GetLa
stError()); | |
| 467 exit(-1); | |
| 468 } else{ | |
| 469 return t - CSTR_EQUAL; | |
| 470 } | |
| 471 } | |
| 472 #endif | |
| 473 | |
| 474 #define BFUNC(name, func, data) \ | |
| 475 int name(int32_t i, int32_t j) { \ | |
| 476 return func(rnd[i].data, ord[j].data); \ | |
| 477 } | |
| 478 | |
| 479 BFUNC(posix_strcoll_null, strcoll, posix_data) | |
| 480 BFUNC(posix_cmpkey, strcmp, posix_key) | |
| 481 BFUNC(win_cmpkey, strcmp, win_key) | |
| 482 BFUNC(win_wcscmp, wcscmp, win_data) | |
| 483 BFUNC(icu_strcmp, u_strcmp, icu_data) | |
| 484 BFUNC(icu_cmpcpo, u_strcmpCodePointOrder, icu_data) | |
| 485 }; | |
| 486 | |
| 487 class CollPerfTest : public UPerfTest { | |
| 488 public: | |
| 489 UCollator * col; | |
| 490 DWORD win_langid; | |
| 491 | |
| 492 UChar * icu_data_all; | |
| 493 int32_t icu_data_all_len; | |
| 494 | |
| 495 int32_t count; | |
| 496 CA_uchar * icu_data; | |
| 497 CA_uint8 * icu_key; | |
| 498 CA_char * posix_data; | |
| 499 CA_char * posix_key; | |
| 500 CA_win_wchar * win_data; | |
| 501 CA_char * win_key; | |
| 502 | |
| 503 DataIndex * rnd_index; // random by icu key | |
| 504 DataIndex * ord_win_data; | |
| 505 DataIndex * ord_win_key; | |
| 506 DataIndex * ord_posix_data; | |
| 507 DataIndex * ord_posix_key; | |
| 508 DataIndex * ord_icu_data; | |
| 509 DataIndex * ord_icu_key; | |
| 510 DataIndex * ord_win_wcscmp; | |
| 511 DataIndex * ord_icu_strcmp; | |
| 512 DataIndex * ord_icu_cmpcpo; | |
| 513 | |
| 514 virtual ~CollPerfTest(){ | |
| 515 ucol_close(col); | |
| 516 delete [] icu_data_all; | |
| 517 delete icu_data; | |
| 518 delete icu_key; | |
| 519 delete posix_data; | |
| 520 delete posix_key; | |
| 521 delete win_data; | |
| 522 delete win_key; | |
| 523 delete[] rnd_index; | |
| 524 delete[] ord_win_data; | |
| 525 delete[] ord_win_key; | |
| 526 delete[] ord_posix_data; | |
| 527 delete[] ord_posix_key; | |
| 528 delete[] ord_icu_data; | |
| 529 delete[] ord_icu_key; | |
| 530 delete[] ord_win_wcscmp; | |
| 531 delete[] ord_icu_strcmp; | |
| 532 delete[] ord_icu_cmpcpo; | |
| 533 } | |
| 534 | |
| 535 CollPerfTest(int32_t argc, const char* argv[], UErrorCode& status):UPerfTest
(argc, argv, status){ | |
| 536 col = NULL; | |
| 537 icu_data_all = NULL; | |
| 538 icu_data = NULL; | |
| 539 icu_key = NULL; | |
| 540 posix_data = NULL; | |
| 541 posix_key = NULL; | |
| 542 win_data =NULL; | |
| 543 win_key = NULL; | |
| 544 | |
| 545 rnd_index = NULL; | |
| 546 ord_win_data= NULL; | |
| 547 ord_win_key= NULL; | |
| 548 ord_posix_data= NULL; | |
| 549 ord_posix_key= NULL; | |
| 550 ord_icu_data= NULL; | |
| 551 ord_icu_key= NULL; | |
| 552 ord_win_wcscmp = NULL; | |
| 553 ord_icu_strcmp = NULL; | |
| 554 ord_icu_cmpcpo = NULL; | |
| 555 | |
| 556 if (U_FAILURE(status)){ | |
| 557 return; | |
| 558 } | |
| 559 | |
| 560 // Parse additional arguments | |
| 561 | |
| 562 UOption options[] = { | |
| 563 UOPTION_DEF("langid", 'i', UOPT_REQUIRES_ARG), // Windows Lan
guage ID number. | |
| 564 UOPTION_DEF("rulefile", 'r', UOPT_REQUIRES_ARG), // --rulef
ile <filename> | |
| 565 // Collation related arguments. All are optional. | |
| 566 // To simplify parsing, two choice arguments are disigned as NO_
ARG. | |
| 567 // The default value is UPPER word in the comment | |
| 568 UOPTION_DEF("c_french", 'f', UOPT_NO_ARG), // --french
<on | OFF> | |
| 569 UOPTION_DEF("c_alternate", 'a', UOPT_NO_ARG), // --alterna
te <NON_IGNORE | shifted> | |
| 570 UOPTION_DEF("c_casefirst", 'c', UOPT_REQUIRES_ARG), // --casefir
st <lower | upper | OFF> | |
| 571 UOPTION_DEF("c_caselevel", 'l', UOPT_NO_ARG), // --caselev
el <on | OFF> | |
| 572 UOPTION_DEF("c_normal", 'n', UOPT_NO_ARG), // --normal
<on | OFF> | |
| 573 UOPTION_DEF("c_strength", 's', UOPT_REQUIRES_ARG), // --strengt
h <1-5> | |
| 574 }; | |
| 575 int32_t opt_len = (sizeof(options)/sizeof(options[0])); | |
| 576 enum {i, r,f,a,c,l,n,s}; // The buffer between the option items' order
and their references | |
| 577 | |
| 578 _remainingArgc = u_parseArgs(_remainingArgc, (char**)argv, opt_len, opti
ons); | |
| 579 | |
| 580 if (_remainingArgc < 0){ | |
| 581 status = U_ILLEGAL_ARGUMENT_ERROR; | |
| 582 return; | |
| 583 } | |
| 584 | |
| 585 if (locale == NULL){ | |
| 586 locale = "en_US"; // set default locale | |
| 587 } | |
| 588 | |
| 589 #if U_PLATFORM_HAS_WIN32_API | |
| 590 if (options[i].doesOccur) { | |
| 591 char *endp; | |
| 592 int tmp = strtol(options[i].value, &endp, 0); | |
| 593 if (endp == options[i].value) { | |
| 594 status = U_ILLEGAL_ARGUMENT_ERROR; | |
| 595 return; | |
| 596 } | |
| 597 win_langid = MAKELCID(tmp, SORT_DEFAULT); | |
| 598 } else { | |
| 599 win_langid = uloc_getLCID(locale); | |
| 600 } | |
| 601 #endif | |
| 602 | |
| 603 // Set up an ICU collator | |
| 604 if (options[r].doesOccur) { | |
| 605 // TODO: implement it | |
| 606 } else { | |
| 607 col = ucol_open(locale, &status); | |
| 608 if (U_FAILURE(status)) { | |
| 609 return; | |
| 610 } | |
| 611 } | |
| 612 | |
| 613 if (options[f].doesOccur) { | |
| 614 ucol_setAttribute(col, UCOL_FRENCH_COLLATION, UCOL_ON, &status); | |
| 615 } else { | |
| 616 ucol_setAttribute(col, UCOL_FRENCH_COLLATION, UCOL_OFF, &status); | |
| 617 } | |
| 618 | |
| 619 if (options[a].doesOccur) { | |
| 620 ucol_setAttribute(col, UCOL_ALTERNATE_HANDLING, UCOL_SHIFTED, &statu
s); | |
| 621 } | |
| 622 | |
| 623 if (options[c].doesOccur) { // strcmp() has i18n encoding problem | |
| 624 if (strcmp("lower", options[c].value) == 0){ | |
| 625 ucol_setAttribute(col, UCOL_CASE_FIRST, UCOL_LOWER_FIRST, &statu
s); | |
| 626 } else if (strcmp("upper", options[c].value) == 0) { | |
| 627 ucol_setAttribute(col, UCOL_CASE_FIRST, UCOL_UPPER_FIRST, &statu
s); | |
| 628 } else { | |
| 629 status = U_ILLEGAL_ARGUMENT_ERROR; | |
| 630 return; | |
| 631 } | |
| 632 } | |
| 633 | |
| 634 if (options[l].doesOccur){ | |
| 635 ucol_setAttribute(col, UCOL_CASE_LEVEL, UCOL_ON, &status); | |
| 636 } | |
| 637 | |
| 638 if (options[n].doesOccur){ | |
| 639 ucol_setAttribute(col, UCOL_NORMALIZATION_MODE, UCOL_ON, &status); | |
| 640 } | |
| 641 | |
| 642 if (options[s].doesOccur) { | |
| 643 char *endp; | |
| 644 int tmp = strtol(options[l].value, &endp, 0); | |
| 645 if (endp == options[l].value) { | |
| 646 status = U_ILLEGAL_ARGUMENT_ERROR; | |
| 647 return; | |
| 648 } | |
| 649 switch (tmp) { | |
| 650 case 1: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_PRIMARY, &sta
tus); break; | |
| 651 case 2: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_SECONDARY, &s
tatus); break; | |
| 652 case 3: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_TERTIARY, &st
atus); break; | |
| 653 case 4: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_QUATERNARY, &
status); break; | |
| 654 case 5: ucol_setAttribute(col, UCOL_STRENGTH, UCOL_IDENTICAL, &s
tatus); break; | |
| 655 default: status = U_ILLEGAL_ARGUMENT_ERROR;
return; | |
| 656 } | |
| 657 } | |
| 658 prepareData(status); | |
| 659 } | |
| 660 | |
| 661 //to avoid use the annoying 'id' in TESTCASE(id,test) macro or the like | |
| 662 #define TEST(testname, classname, arg1, arg2, arg3, arg4, arg5, arg6) \ | |
| 663 if(temp == index) {\ | |
| 664 name = #testname;\ | |
| 665 if (exec) {\ | |
| 666 UErrorCode status = U_ZERO_ERROR;\ | |
| 667 UPerfFunction * t = new classname(status,arg1, arg2, arg3, arg4, arg5, arg6)
;\ | |
| 668 if (U_FAILURE(status)) {\ | |
| 669 delete t;\ | |
| 670 return NULL;\ | |
| 671 } else {\ | |
| 672 return t;\ | |
| 673 }\ | |
| 674 } else {\ | |
| 675 return NULL;\ | |
| 676 }\ | |
| 677 }\ | |
| 678 temp++\ | |
| 679 | |
| 680 | |
| 681 virtual UPerfFunction* runIndexedTest( /*[in]*/int32_t index, /*[in]*/UBool
exec, /*[out]*/const char* &name, /*[in]*/ char* par = NULL ){ | |
| 682 int temp = 0; | |
| 683 | |
| 684 #define TEST_KEYGEN(testname, func)\ | |
| 685 TEST(testname, CmdKeyGen, col, win_langid, count, rnd_index, &CmdKeyGen::fun
c, 0) | |
| 686 TEST_KEYGEN(TestIcu_KeyGen_null, icu_key_null); | |
| 687 TEST_KEYGEN(TestIcu_KeyGen_len, icu_key_len); | |
| 688 TEST_KEYGEN(TestPosix_KeyGen_null, posix_key_null); | |
| 689 #if U_PLATFORM_HAS_WIN32_API | |
| 690 TEST_KEYGEN(TestWin_KeyGen_null, win_key_null); | |
| 691 TEST_KEYGEN(TestWin_KeyGen_len, win_key_len); | |
| 692 #endif | |
| 693 | |
| 694 #define TEST_ITER(testname, func)\ | |
| 695 TEST(testname, CmdIter, col, count, icu_data, &CmdIter::func,0,0) | |
| 696 TEST_ITER(TestIcu_ForwardIter_null, icu_forward_null); | |
| 697 TEST_ITER(TestIcu_ForwardIter_len, icu_forward_len); | |
| 698 TEST_ITER(TestIcu_BackwardIter_null, icu_backward_null); | |
| 699 TEST_ITER(TestIcu_BackwardIter_len, icu_backward_len); | |
| 700 | |
| 701 #define TEST_ITER_ALL(testname, func)\ | |
| 702 TEST(testname, CmdIterAll, col, icu_data_all_len, icu_data_all, CmdIterAll::
func,0,0) | |
| 703 TEST_ITER_ALL(TestIcu_ForwardIter_all_null, forward_null); | |
| 704 TEST_ITER_ALL(TestIcu_ForwardIter_all_len, forward_len); | |
| 705 TEST_ITER_ALL(TestIcu_BackwardIter_all_null, backward_null); | |
| 706 TEST_ITER_ALL(TestIcu_BackwardIter_all_len, backward_len); | |
| 707 | |
| 708 #define TEST_QSORT(testname, func)\ | |
| 709 TEST(testname, CmdQsort, rnd_index, count, sizeof(DataIndex), CmdQsort::func
,0,0) | |
| 710 TEST_QSORT(TestIcu_qsort_strcoll_null, icu_strcoll_null); | |
| 711 TEST_QSORT(TestIcu_qsort_strcoll_len, icu_strcoll_len); | |
| 712 TEST_QSORT(TestIcu_qsort_usekey, icu_cmpkey); | |
| 713 TEST_QSORT(TestPosix_qsort_strcoll_null, posix_strcoll_null); | |
| 714 TEST_QSORT(TestPosix_qsort_usekey, posix_cmpkey); | |
| 715 #if U_PLATFORM_HAS_WIN32_API | |
| 716 TEST_QSORT(TestWin_qsort_CompareStringW_null, win_cmp_null); | |
| 717 TEST_QSORT(TestWin_qsort_CompareStringW_len, win_cmp_len); | |
| 718 TEST_QSORT(TestWin_qsort_usekey, win_cmpkey); | |
| 719 #endif | |
| 720 | |
| 721 #define TEST_BIN(testname, func)\ | |
| 722 TEST(testname, CmdBinSearch, col, win_langid, count, rnd_index, ord_icu_key,
&CmdBinSearch::func) | |
| 723 TEST_BIN(TestIcu_BinarySearch_strcoll_null, icu_strcoll_null); | |
| 724 TEST_BIN(TestIcu_BinarySearch_strcoll_len, icu_strcoll_len); | |
| 725 TEST_BIN(TestIcu_BinarySearch_usekey, icu_cmpkey); | |
| 726 TEST_BIN(TestIcu_BinarySearch_strcmp, icu_strcmp); | |
| 727 TEST_BIN(TestIcu_BinarySearch_cmpCPO, icu_cmpcpo); | |
| 728 TEST_BIN(TestPosix_BinarySearch_strcoll_null, posix_strcoll_null); | |
| 729 TEST_BIN(TestPosix_BinarySearch_usekey, posix_cmpkey); | |
| 730 #if U_PLATFORM_HAS_WIN32_API | |
| 731 TEST_BIN(TestWin_BinarySearch_CompareStringW_null, win_cmp_null); | |
| 732 TEST_BIN(TestWin_BinarySearch_CompareStringW_len, win_cmp_len); | |
| 733 #endif | |
| 734 TEST_BIN(TestWin_BinarySearch_usekey, win_cmpkey); | |
| 735 TEST_BIN(TestWin_BinarySearch_wcscmp, win_wcscmp); | |
| 736 | |
| 737 name=""; | |
| 738 return NULL; | |
| 739 } | |
| 740 | |
| 741 | |
| 742 | |
| 743 void prepareData(UErrorCode& status){ | |
| 744 if(U_FAILURE(status)) return; | |
| 745 if (icu_data) return; // prepared | |
| 746 | |
| 747 icu_data = new CA_uchar(); | |
| 748 | |
| 749 // Following code is borrowed from UPerfTest::getLines(); | |
| 750 const UChar* line=NULL; | |
| 751 int32_t len =0; | |
| 752 for (;;) { | |
| 753 line = ucbuf_readline(ucharBuf,&len,&status); | |
| 754 if(line == NULL || U_FAILURE(status)){break;} | |
| 755 | |
| 756 // Refer to the source code of ucbuf_readline() | |
| 757 // 1. 'len' includs the line terminal symbols | |
| 758 // 2. The length of the line terminal symbols is only one character | |
| 759 // 3. The Windows CR LF line terminal symbols will be converted to C
R | |
| 760 | |
| 761 if (len == 1) { | |
| 762 continue; //skip empty line | |
| 763 } else { | |
| 764 icu_data->append_one(len); | |
| 765 memcpy(icu_data->last(), line, len * sizeof(UChar)); | |
| 766 icu_data->last()[len -1] = NULL; | |
| 767 } | |
| 768 } | |
| 769 if(U_FAILURE(status)) return; | |
| 770 | |
| 771 // UTF-16 -> UTF-8 conversion. | |
| 772 UConverter *conv = ucnv_open("utf-8", &status); // just UTF-8 for now. | |
| 773 if (U_FAILURE(status)) return; | |
| 774 | |
| 775 count = icu_data->count; | |
| 776 | |
| 777 icu_data_all_len = icu_data->index[count]; // includes all NULLs | |
| 778 icu_data_all_len -= count; // excludes all NULLs | |
| 779 icu_data_all_len += 1; // the terminal NULL | |
| 780 icu_data_all = new UChar[icu_data_all_len]; | |
| 781 icu_data_all[icu_data_all_len - 1] = 0; //the terminal NULL | |
| 782 | |
| 783 icu_key = new CA_uint8; | |
| 784 win_data = new CA_win_wchar; | |
| 785 win_key = new CA_char; | |
| 786 posix_data = new CA_char; | |
| 787 posix_key = new CA_char; | |
| 788 rnd_index = new DataIndex[count]; | |
| 789 DataIndex::win_langid = win_langid; | |
| 790 DataIndex::col = col; | |
| 791 | |
| 792 | |
| 793 UChar * p = icu_data_all; | |
| 794 int32_t s; | |
| 795 int32_t t; | |
| 796 for (int i=0; i < count; i++) { | |
| 797 // ICU all data | |
| 798 s = sizeof(UChar) * icu_data->lengthOf(i); | |
| 799 memcpy(p, icu_data->dataOf(i), s); | |
| 800 p += icu_data->lengthOf(i); | |
| 801 | |
| 802 // ICU data | |
| 803 | |
| 804 // ICU key | |
| 805 s = ucol_getSortKey(col, icu_data->dataOf(i), -1,NULL, 0); | |
| 806 icu_key->append_one(s); | |
| 807 t = ucol_getSortKey(col, icu_data->dataOf(i), -1,icu_key->last(), s)
; | |
| 808 if (t != s) {status = U_INVALID_FORMAT_ERROR;return;} | |
| 809 | |
| 810 // POSIX data | |
| 811 s = ucnv_fromUChars(conv,NULL, 0, icu_data->dataOf(i), icu_data->len
gthOf(i), &status); | |
| 812 if (status == U_BUFFER_OVERFLOW_ERROR || status == U_ZERO_ERROR){ | |
| 813 status = U_ZERO_ERROR; | |
| 814 } else { | |
| 815 return; | |
| 816 } | |
| 817 posix_data->append_one(s + 1); // plus terminal NULL | |
| 818 t = ucnv_fromUChars(conv,posix_data->last(), s, icu_data->dataOf(i),
icu_data->lengthOf(i), &status); | |
| 819 if (U_FAILURE(status)) return; | |
| 820 if ( t != s){status = U_INVALID_FORMAT_ERROR;return;} | |
| 821 posix_data->last()[s] = 0; | |
| 822 | |
| 823 // POSIX key | |
| 824 s = strxfrm(NULL, posix_data->dataOf(i), 0); | |
| 825 if (s == INT_MAX){status = U_INVALID_FORMAT_ERROR;return;} | |
| 826 posix_key->append_one(s); | |
| 827 t = strxfrm(posix_key->last(), posix_data->dataOf(i), s); | |
| 828 if (t != s) {status = U_INVALID_FORMAT_ERROR;return;} | |
| 829 | |
| 830 #if U_PLATFORM_HAS_WIN32_API | |
| 831 // Win data | |
| 832 s = icu_data->lengthOf(i) + 1; // plus terminal NULL | |
| 833 win_data->append_one(s); | |
| 834 memcpy(win_data->last(), icu_data->dataOf(i), sizeof(WCHAR) * s); | |
| 835 | |
| 836 // Win key | |
| 837 s = LCMapStringW(win_langid, LCMAP_SORTKEY, win_data->dataOf(i), win
_data->lengthOf(i), NULL,0); | |
| 838 if (s == 0) {status = U_INVALID_FORMAT_ERROR;return;} | |
| 839 win_key->append_one(s); | |
| 840 t = LCMapStringW(win_langid, LCMAP_SORTKEY, win_data->dataOf(i), win
_data->lengthOf(i), (WCHAR *)(win_key->last()),s); | |
| 841 if (t != s) {status = U_INVALID_FORMAT_ERROR;return;} | |
| 842 #endif | |
| 843 }; | |
| 844 | |
| 845 // append_one() will make points shifting, should not merge following co
de into previous iteration | |
| 846 for (int i=0; i < count; i++) { | |
| 847 rnd_index[i].icu_key = icu_key->dataOf(i); | |
| 848 rnd_index[i].icu_data = icu_data->dataOf(i); | |
| 849 rnd_index[i].icu_data_len = icu_data->lengthOf(i); | |
| 850 rnd_index[i].posix_key = posix_key->last(); | |
| 851 rnd_index[i].posix_data = posix_data->dataOf(i); | |
| 852 rnd_index[i].posix_data_len = posix_data->lengthOf(i); | |
| 853 #if U_PLATFORM_HAS_WIN32_API | |
| 854 rnd_index[i].win_key = win_key->dataOf(i); | |
| 855 rnd_index[i].win_data = win_data->dataOf(i); | |
| 856 rnd_index[i].win_data_len = win_data->lengthOf(i); | |
| 857 #endif | |
| 858 }; | |
| 859 | |
| 860 ucnv_close(conv); | |
| 861 qsort(rnd_index, count, sizeof(DataIndex), CmdQsort::q_random); | |
| 862 | |
| 863 #define SORT(data, func) \ | |
| 864 data = new DataIndex[count];\ | |
| 865 memcpy(data, rnd_index, count * sizeof(DataIndex));\ | |
| 866 qsort(data, count, sizeof(DataIndex), CmdQsort::func) | |
| 867 | |
| 868 SORT(ord_icu_data, icu_strcoll_len); | |
| 869 SORT(ord_icu_key, icu_cmpkey); | |
| 870 SORT(ord_posix_data, posix_strcoll_null); | |
| 871 SORT(ord_posix_key, posix_cmpkey); | |
| 872 #if U_PLATFORM_HAS_WIN32_API | |
| 873 SORT(ord_win_data, win_cmp_len); | |
| 874 SORT(ord_win_key, win_cmpkey); | |
| 875 SORT(ord_win_wcscmp, win_wcscmp); | |
| 876 #endif | |
| 877 SORT(ord_icu_strcmp, icu_strcmp); | |
| 878 SORT(ord_icu_cmpcpo, icu_cmpcpo); | |
| 879 } | |
| 880 }; | |
| 881 | |
| 882 | |
| 883 int main(int argc, const char *argv[]) | |
| 884 { | |
| 885 | |
| 886 UErrorCode status = U_ZERO_ERROR; | |
| 887 CollPerfTest test(argc, argv, status); | |
| 888 | |
| 889 if (U_FAILURE(status)){ | |
| 890 printf("The error is %s\n", u_errorName(status)); | |
| 891 //TODO: print usage here | |
| 892 return status; | |
| 893 } | |
| 894 | |
| 895 if (test.run() == FALSE){ | |
| 896 fprintf(stderr, "FAILED: Tests could not be run please check the " | |
| 897 "arguments.\n"); | |
| 898 return -1; | |
| 899 } | |
| 900 return 0; | |
| 901 } | |
| 902 | |
| OLD | NEW |