OLD | NEW |
(Empty) | |
| 1 #include <wctype.h> |
| 2 #include "libc.h" |
| 3 |
/*
 * Initializer helpers for the case-run table.
 *
 * CASEMAP(first_up, last_up, first_lo) yields three values: the first
 * upper-case code point, the offset from first_up to first_lo, and the
 * number of code points in the inclusive range first_up..last_up.
 *
 * CASELACE(first_up, last_up) is the same with a fixed offset of 1, i.e.
 * each upper-case code point is immediately followed by its lower-case
 * partner.
 */
#define CASEMAP(first_up,last_up,first_lo) \
	{ (first_up), (first_lo)-(first_up), (last_up)-(first_up)+1 }
#define CASELACE(first_up,last_up) \
	{ (first_up), 1, (last_up)-(first_up)+1 }
| 6 |
| 7 static const struct { |
| 8 unsigned short upper; |
| 9 signed char lower; |
| 10 unsigned char len; |
| 11 } casemaps[] = { |
| 12 CASEMAP('A','Z','a'), |
| 13 CASEMAP(0xc0,0xde,0xe0), |
| 14 |
| 15 CASELACE(0x0100,0x012e), |
| 16 CASELACE(0x0132,0x0136), |
| 17 CASELACE(0x0139,0x0147), |
| 18 CASELACE(0x014a,0x0176), |
| 19 CASELACE(0x0179,0x017d), |
| 20 |
| 21 CASELACE(0x370,0x372), |
| 22 CASEMAP(0x391,0x3a1,0x3b1), |
| 23 CASEMAP(0x3a3,0x3ab,0x3c3), |
| 24 CASEMAP(0x400,0x40f,0x450), |
| 25 CASEMAP(0x410,0x42f,0x430), |
| 26 |
| 27 CASELACE(0x460,0x480), |
| 28 CASELACE(0x48a,0x4be), |
| 29 CASELACE(0x4c1,0x4cd), |
| 30 CASELACE(0x4d0,0x50e), |
| 31 |
| 32 CASELACE(0x514,0x526), |
| 33 CASEMAP(0x531,0x556,0x561), |
| 34 |
| 35 CASELACE(0x01a0,0x01a4), |
| 36 CASELACE(0x01b3,0x01b5), |
| 37 CASELACE(0x01cd,0x01db), |
| 38 CASELACE(0x01de,0x01ee), |
| 39 CASELACE(0x01f8,0x021e), |
| 40 CASELACE(0x0222,0x0232), |
| 41 CASELACE(0x03d8,0x03ee), |
| 42 |
| 43 CASELACE(0x1e00,0x1e94), |
| 44 CASELACE(0x1ea0,0x1efe), |
| 45 |
| 46 CASEMAP(0x1f08,0x1f0f,0x1f00), |
| 47 CASEMAP(0x1f18,0x1f1d,0x1f10), |
| 48 CASEMAP(0x1f28,0x1f2f,0x1f20), |
| 49 CASEMAP(0x1f38,0x1f3f,0x1f30), |
| 50 CASEMAP(0x1f48,0x1f4d,0x1f40), |
| 51 |
| 52 CASEMAP(0x1f68,0x1f6f,0x1f60), |
| 53 CASEMAP(0x1f88,0x1f8f,0x1f80), |
| 54 CASEMAP(0x1f98,0x1f9f,0x1f90), |
| 55 CASEMAP(0x1fa8,0x1faf,0x1fa0), |
| 56 CASEMAP(0x1fb8,0x1fb9,0x1fb0), |
| 57 CASEMAP(0x1fba,0x1fbb,0x1f70), |
| 58 CASEMAP(0x1fc8,0x1fcb,0x1f72), |
| 59 CASEMAP(0x1fd8,0x1fd9,0x1fd0), |
| 60 CASEMAP(0x1fda,0x1fdb,0x1f76), |
| 61 CASEMAP(0x1fe8,0x1fe9,0x1fe0), |
| 62 CASEMAP(0x1fea,0x1feb,0x1f7a), |
| 63 CASEMAP(0x1ff8,0x1ff9,0x1f78), |
| 64 CASEMAP(0x1ffa,0x1ffb,0x1f7c), |
| 65 |
| 66 CASELACE(0x246,0x24e), |
| 67 CASELACE(0x510,0x512), |
| 68 CASEMAP(0x2160,0x216f,0x2170), |
| 69 CASEMAP(0x2c00,0x2c2e,0x2c30), |
| 70 CASELACE(0x2c67,0x2c6b), |
| 71 CASELACE(0x2c80,0x2ce2), |
| 72 CASELACE(0x2ceb,0x2ced), |
| 73 |
| 74 CASELACE(0xa640,0xa66c), |
| 75 CASELACE(0xa680,0xa696), |
| 76 |
| 77 CASELACE(0xa722,0xa72e), |
| 78 CASELACE(0xa732,0xa76e), |
| 79 CASELACE(0xa779,0xa77b), |
| 80 CASELACE(0xa77e,0xa786), |
| 81 |
| 82 CASELACE(0xa790,0xa792), |
| 83 CASELACE(0xa7a0,0xa7a8), |
| 84 |
| 85 CASEMAP(0xff21,0xff3a,0xff41), |
| 86 { 0,0,0 } |
| 87 }; |
| 88 |
/*
 * Individual { upper, lower } mappings that do not fit the run table.
 *
 * __towcase() scans this table linearly after the run table has failed to
 * match.  When lowering it looks for wc in column 0 and returns column 1;
 * when uppering it looks in column 1 and returns column 0.  The first
 * match wins, so entry order matters where a code point appears more than
 * once (for example the three-form digraphs at 0x01c4..0x01cc).  The
 * { 0, 0 } entry terminates the scan.
 *
 * NOTE(review): because the scan is bidirectional, one-way entries whose
 * target is not already claimed by the run table also apply in reverse.
 * In particular { 0x1e9e, 0x00df } makes towupper(0x00df) return 0x1e9e;
 * Unicode's simple case mappings appear to leave U+00DF unchanged --
 * confirm whether this is intended.
 */
static const unsigned short pairs[][2] = {
	/* Latin */
	{ 'I',    0x0131 }, { 'S',    0x017f }, { 0x0130, 'i'    },
	{ 0x0178, 0x00ff }, { 0x0181, 0x0253 }, { 0x0182, 0x0183 },
	{ 0x0184, 0x0185 }, { 0x0186, 0x0254 }, { 0x0187, 0x0188 },
	{ 0x0189, 0x0256 }, { 0x018a, 0x0257 }, { 0x018b, 0x018c },
	{ 0x018e, 0x01dd }, { 0x018f, 0x0259 }, { 0x0190, 0x025b },
	{ 0x0191, 0x0192 }, { 0x0193, 0x0260 }, { 0x0194, 0x0263 },
	{ 0x0196, 0x0269 }, { 0x0197, 0x0268 }, { 0x0198, 0x0199 },
	{ 0x019c, 0x026f }, { 0x019d, 0x0272 }, { 0x019f, 0x0275 },
	{ 0x01a6, 0x0280 }, { 0x01a7, 0x01a8 }, { 0x01a9, 0x0283 },
	{ 0x01ac, 0x01ad }, { 0x01ae, 0x0288 }, { 0x01af, 0x01b0 },
	{ 0x01b1, 0x028a }, { 0x01b2, 0x028b }, { 0x01b7, 0x0292 },
	{ 0x01b8, 0x01b9 }, { 0x01bc, 0x01bd },

	/* digraphs with three forms: one row per letter */
	{ 0x01c4, 0x01c6 }, { 0x01c4, 0x01c5 }, { 0x01c5, 0x01c6 },
	{ 0x01c7, 0x01c9 }, { 0x01c7, 0x01c8 }, { 0x01c8, 0x01c9 },
	{ 0x01ca, 0x01cc }, { 0x01ca, 0x01cb }, { 0x01cb, 0x01cc },
	{ 0x01f1, 0x01f3 }, { 0x01f1, 0x01f2 }, { 0x01f2, 0x01f3 },

	{ 0x01f4, 0x01f5 }, { 0x01f6, 0x0195 }, { 0x01f7, 0x01bf },
	{ 0x0220, 0x019e },

	/* Greek */
	{ 0x0386, 0x03ac }, { 0x0388, 0x03ad }, { 0x0389, 0x03ae },
	{ 0x038a, 0x03af }, { 0x038c, 0x03cc }, { 0x038e, 0x03cd },
	{ 0x038f, 0x03ce }, { 0x0399, 0x0345 }, { 0x0399, 0x1fbe },
	{ 0x03a3, 0x03c2 }, { 0x03f7, 0x03f8 }, { 0x03fa, 0x03fb },

	{ 0x1e60, 0x1e9b }, { 0x1e9e, 0x00df },

	/* Greek Extended */
	{ 0x1f59, 0x1f51 }, { 0x1f5b, 0x1f53 }, { 0x1f5d, 0x1f55 },
	{ 0x1f5f, 0x1f57 }, { 0x1fbc, 0x1fb3 }, { 0x1fcc, 0x1fc3 },
	{ 0x1fec, 0x1fe5 }, { 0x1ffc, 0x1ff3 },

	{ 0x023a, 0x2c65 }, { 0x023b, 0x023c }, { 0x023d, 0x019a },
	{ 0x023e, 0x2c66 }, { 0x0241, 0x0242 }, { 0x0243, 0x0180 },
	{ 0x0244, 0x0289 }, { 0x0245, 0x028c }, { 0x03f4, 0x03b8 },
	{ 0x03f9, 0x03f2 }, { 0x03fd, 0x037b }, { 0x03fe, 0x037c },
	{ 0x03ff, 0x037d }, { 0x04c0, 0x04cf },

	{ 0x2126, 0x03c9 }, { 0x212a, 'k'    }, { 0x212b, 0x00e5 },
	{ 0x2132, 0x214e }, { 0x2183, 0x2184 }, { 0x2c60, 0x2c61 },
	{ 0x2c62, 0x026b }, { 0x2c63, 0x1d7d }, { 0x2c64, 0x027d },
	{ 0x2c6d, 0x0251 }, { 0x2c6e, 0x0271 }, { 0x2c6f, 0x0250 },
	{ 0x2c70, 0x0252 }, { 0x2c72, 0x2c73 }, { 0x2c75, 0x2c76 },
	{ 0x2c7e, 0x023f }, { 0x2c7f, 0x0240 }, { 0x2cf2, 0x2cf3 },

	{ 0xa77d, 0x1d79 }, { 0xa78b, 0xa78c }, { 0xa78d, 0x0265 },
	{ 0xa7aa, 0x0266 },

	/* the two letters just past the contiguous range handled in __towcase() */
	{ 0x10c7, 0x2d27 }, { 0x10cd, 0x2d2d },

	/* bogus greek 'symbol' letters */
	{ 0x0376, 0x0377 }, { 0x039c, 0x00b5 }, { 0x0392, 0x03d0 },
	{ 0x0398, 0x03d1 }, { 0x03a6, 0x03d5 }, { 0x03a0, 0x03d6 },
	{ 0x039a, 0x03f0 }, { 0x03a1, 0x03f1 }, { 0x0395, 0x03f5 },
	{ 0x03cf, 0x03d7 },

	/* terminator */
	{ 0, 0 }
};
| 221 |
| 222 |
| 223 static wchar_t __towcase(wchar_t wc, int lower) |
| 224 { |
| 225 int i; |
| 226 int lmul = 2*lower-1; |
| 227 int lmask = lower-1; |
| 228 /* no letters with case in these large ranges */ |
| 229 if (!iswalpha(wc) |
| 230 || (unsigned)wc - 0x0600 <= 0x0fff-0x0600 |
| 231 || (unsigned)wc - 0x2e00 <= 0xa63f-0x2e00 |
| 232 || (unsigned)wc - 0xa800 <= 0xfeff-0xa800) |
| 233 return wc; |
| 234 /* special case because the diff between upper/lower is too big */ |
| 235 if (lower && (unsigned)wc - 0x10a0 < 0x2e) |
| 236 if (wc>0x10c5 && wc != 0x10c7 && wc != 0x10cd) return wc; |
| 237 else return wc + 0x2d00 - 0x10a0; |
| 238 if (!lower && (unsigned)wc - 0x2d00 < 0x26) |
| 239 if (wc>0x2d25 && wc != 0x2d27 && wc != 0x2d2d) return wc; |
| 240 else return wc + 0x10a0 - 0x2d00; |
| 241 for (i=0; casemaps[i].len; i++) { |
| 242 int base = casemaps[i].upper + (lmask & casemaps[i].lower); |
| 243 if ((unsigned)wc-base < casemaps[i].len) { |
| 244 if (casemaps[i].lower == 1) |
| 245 return wc + lower - ((wc-casemaps[i].upper)&1); |
| 246 return wc + lmul*casemaps[i].lower; |
| 247 } |
| 248 } |
| 249 for (i=0; pairs[i][1-lower]; i++) { |
| 250 if (pairs[i][1-lower] == wc) |
| 251 return pairs[i][lower]; |
| 252 } |
| 253 if ((unsigned)wc - (0x10428 - 0x28*lower) < 0x28) |
| 254 return wc - 0x28 + 0x50*lower; |
| 255 return wc; |
| 256 } |
| 257 |
/*
 * Convert wc to upper case.  Delegates to __towcase() with the direction
 * flag cleared; wc is returned unchanged when that helper finds no
 * mapping for it.
 */
wint_t towupper(wint_t wc)
{
	const int to_lower = 0;

	return __towcase(wc, to_lower);
}
| 262 |
/*
 * Convert wc to lower case.  Delegates to __towcase() with the direction
 * flag set; wc is returned unchanged when that helper finds no mapping
 * for it.
 */
wint_t towlower(wint_t wc)
{
	const int to_lower = 1;

	return __towcase(wc, to_lower);
}
| 267 |
| 268 wint_t __towupper_l(wint_t c, locale_t l) |
| 269 { |
| 270 return towupper(c); |
| 271 } |
| 272 |
| 273 wint_t __towlower_l(wint_t c, locale_t l) |
| 274 { |
| 275 return towlower(c); |
| 276 } |
| 277 |
/*
 * Expose the locale-taking wrappers under their unprefixed names.
 * NOTE(review): weak_alias is not defined in this file (presumably it
 * comes from "libc.h") and is assumed to declare the second name as a
 * weak alias of the first -- confirm against that header.
 */
weak_alias(__towupper_l, towupper_l);
weak_alias(__towlower_l, towlower_l);
OLD | NEW |