OLD | NEW |
| (Empty) |
1 /* | |
2 * Copyright (C) 2008 Nokia Corporation and/or its subsidiary(-ies) | |
3 * | |
4 * This is part of HarfBuzz, an OpenType Layout engine library. | |
5 * | |
6 * Permission is hereby granted, without written agreement and without | |
7 * license or royalty fees, to use, copy, modify, and distribute this | |
8 * software and its documentation for any purpose, provided that the | |
9 * above copyright notice and the following two paragraphs appear in | |
10 * all copies of this software. | |
11 * | |
12 * IN NO EVENT SHALL THE COPYRIGHT HOLDER BE LIABLE TO ANY PARTY FOR | |
13 * DIRECT, INDIRECT, SPECIAL, INCIDENTAL, OR CONSEQUENTIAL DAMAGES | |
14 * ARISING OUT OF THE USE OF THIS SOFTWARE AND ITS DOCUMENTATION, EVEN | |
15 * IF THE COPYRIGHT HOLDER HAS BEEN ADVISED OF THE POSSIBILITY OF SUCH | |
16 * DAMAGE. | |
17 * | |
18 * THE COPYRIGHT HOLDER SPECIFICALLY DISCLAIMS ANY WARRANTIES, INCLUDING, | |
19 * BUT NOT LIMITED TO, THE IMPLIED WARRANTIES OF MERCHANTABILITY AND | |
20 * FITNESS FOR A PARTICULAR PURPOSE. THE SOFTWARE PROVIDED HEREUNDER IS | |
21 * ON AN "AS IS" BASIS, AND THE COPYRIGHT HOLDER HAS NO OBLIGATION TO | |
22 * PROVIDE MAINTENANCE, SUPPORT, UPDATES, ENHANCEMENTS, OR MODIFICATIONS. | |
23 */ | |
24 | |
25 #include "harfbuzz-shaper.h" | |
26 #include "harfbuzz-shaper-private.h" | |
27 | |
28 #include <assert.h> | |
29 | |
30 static const HB_UChar16 ReplacementCharacter = 0xfffd; | |
31 | |
32 typedef struct { | |
33 unsigned char shape; | |
34 unsigned char justification; | |
35 } HB_ArabicProperties; | |
36 | |
37 typedef enum { | |
38 XIsolated, | |
39 XFinal, | |
40 XInitial, | |
41 XMedial, | |
42 /* intermediate state */ | |
43 XCausing | |
44 } ArabicShape; | |
45 | |
46 /* | |
47 // these groups correspond to the groups defined in the Unicode standard. | |
48 // Some of these groups are equal with regards to both joining and line breaking
behaviour, | |
49 // and thus have the same enum value | |
50 // | |
51 // I'm not sure the mapping of syriac to arabic enums is correct with regards to
justification, but as | |
52 // I couldn't find any better document I'll hope for the best. | |
53 */ | |
54 typedef enum { | |
55 /* NonJoining */ | |
56 ArabicNone, | |
57 ArabicSpace, | |
58 /* Transparent */ | |
59 Transparent, | |
60 /* Causing */ | |
61 Center, | |
62 Kashida, | |
63 | |
64 /* Arabic */ | |
65 /* Dual */ | |
66 Beh, | |
67 Noon, | |
68 Meem = Noon, | |
69 Heh = Noon, | |
70 KnottedHeh = Noon, | |
71 HehGoal = Noon, | |
72 SwashKaf = Noon, | |
73 Yeh, | |
74 Hah, | |
75 Seen, | |
76 Sad = Seen, | |
77 Tah, | |
78 Kaf = Tah, | |
79 Gaf = Tah, | |
80 Lam = Tah, | |
81 Ain, | |
82 Feh = Ain, | |
83 Qaf = Ain, | |
84 /* Right */ | |
85 Alef, | |
86 Waw, | |
87 Dal, | |
88 TehMarbuta = Dal, | |
89 Reh, | |
90 HamzaOnHehGoal, | |
91 YehWithTail = HamzaOnHehGoal, | |
92 YehBarre = HamzaOnHehGoal, | |
93 | |
94 /* Syriac */ | |
95 /* Dual */ | |
96 Beth = Beh, | |
97 Gamal = Ain, | |
98 Heth = Noon, | |
99 Teth = Hah, | |
100 Yudh = Noon, | |
101 Kaph = Noon, | |
102 Lamadh = Lam, | |
103 Mim = Noon, | |
104 Nun = Noon, | |
105 Semakh = Noon, | |
106 FinalSemakh = Noon, | |
107 SyriacE = Ain, | |
108 Pe = Ain, | |
109 ReversedPe = Hah, | |
110 Qaph = Noon, | |
111 Shin = Noon, | |
112 Fe = Ain, | |
113 | |
114 /* Right */ | |
115 Alaph = Alef, | |
116 Dalath = Dal, | |
117 He = Dal, | |
118 SyriacWaw = Waw, | |
119 Zain = Alef, | |
120 YudhHe = Waw, | |
121 Sadhe = HamzaOnHehGoal, | |
122 Taw = Dal, | |
123 | |
124 /* Compiler bug? Otherwise ArabicGroupsEnd would be equal to Dal + 1. */ | |
125 Dummy = HamzaOnHehGoal, | |
126 ArabicGroupsEnd | |
127 } ArabicGroup; | |
128 | |
129 static const unsigned char arabic_group[0x150] = { | |
130 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
131 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
132 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
133 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
134 | |
135 Transparent, Transparent, Transparent, Transparent, | |
136 Transparent, Transparent, ArabicNone, ArabicNone, | |
137 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
138 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
139 | |
140 ArabicNone, ArabicNone, Alef, Alef, | |
141 Waw, Alef, Yeh, Alef, | |
142 Beh, TehMarbuta, Beh, Beh, | |
143 Hah, Hah, Hah, Dal, | |
144 | |
145 Dal, Reh, Reh, Seen, | |
146 Seen, Sad, Sad, Tah, | |
147 Tah, Ain, Ain, ArabicNone, | |
148 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
149 | |
150 /* 0x640 */ | |
151 Kashida, Feh, Qaf, Kaf, | |
152 Lam, Meem, Noon, Heh, | |
153 Waw, Yeh, Yeh, Transparent, | |
154 Transparent, Transparent, Transparent, Transparent, | |
155 | |
156 Transparent, Transparent, Transparent, Transparent, | |
157 Transparent, Transparent, Transparent, Transparent, | |
158 Transparent, ArabicNone, ArabicNone, ArabicNone, | |
159 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
160 | |
161 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
162 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
163 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
164 ArabicNone, ArabicNone, Beh, Qaf, | |
165 | |
166 Transparent, Alef, Alef, Alef, | |
167 ArabicNone, Alef, Waw, Waw, | |
168 Yeh, Beh, Beh, Beh, | |
169 Beh, Beh, Beh, Beh, | |
170 | |
171 /* 0x680 */ | |
172 Beh, Hah, Hah, Hah, | |
173 Hah, Hah, Hah, Hah, | |
174 Dal, Dal, Dal, Dal, | |
175 Dal, Dal, Dal, Dal, | |
176 | |
177 Dal, Reh, Reh, Reh, | |
178 Reh, Reh, Reh, Reh, | |
179 Reh, Reh, Seen, Seen, | |
180 Seen, Sad, Sad, Tah, | |
181 | |
182 Ain, Feh, Feh, Feh, | |
183 Feh, Feh, Feh, Qaf, | |
184 Qaf, Gaf, SwashKaf, Gaf, | |
185 Kaf, Kaf, Kaf, Gaf, | |
186 | |
187 Gaf, Gaf, Gaf, Gaf, | |
188 Gaf, Lam, Lam, Lam, | |
189 Lam, Noon, Noon, Noon, | |
190 Noon, Noon, KnottedHeh, Hah, | |
191 | |
192 /* 0x6c0 */ | |
193 TehMarbuta, HehGoal, HamzaOnHehGoal, HamzaOnHehGoal, | |
194 Waw, Waw, Waw, Waw, | |
195 Waw, Waw, Waw, Waw, | |
196 Yeh, YehWithTail, Yeh, Waw, | |
197 | |
198 Yeh, Yeh, YehBarre, YehBarre, | |
199 ArabicNone, TehMarbuta, Transparent, Transparent, | |
200 Transparent, Transparent, Transparent, Transparent, | |
201 Transparent, ArabicNone, ArabicNone, Transparent, | |
202 | |
203 Transparent, Transparent, Transparent, Transparent, | |
204 Transparent, ArabicNone, ArabicNone, Transparent, | |
205 Transparent, ArabicNone, Transparent, Transparent, | |
206 Transparent, Transparent, Dal, Reh, | |
207 | |
208 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
209 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
210 ArabicNone, ArabicNone, Seen, Sad, | |
211 Ain, ArabicNone, ArabicNone, KnottedHeh, | |
212 | |
213 /* 0x700 */ | |
214 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
215 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
216 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
217 ArabicNone, ArabicNone, ArabicNone, ArabicNone, | |
218 | |
219 Alaph, Transparent, Beth, Gamal, | |
220 Gamal, Dalath, Dalath, He, | |
221 SyriacWaw, Zain, Heth, Teth, | |
222 Teth, Yudh, YudhHe, Kaph, | |
223 | |
224 Lamadh, Mim, Nun, Semakh, | |
225 FinalSemakh, SyriacE, Pe, ReversedPe, | |
226 Sadhe, Qaph, Dalath, Shin, | |
227 Taw, Beth, Gamal, Dalath, | |
228 | |
229 Transparent, Transparent, Transparent, Transparent, | |
230 Transparent, Transparent, Transparent, Transparent, | |
231 Transparent, Transparent, Transparent, Transparent, | |
232 Transparent, Transparent, Transparent, Transparent, | |
233 | |
234 Transparent, Transparent, Transparent, Transparent, | |
235 Transparent, Transparent, Transparent, Transparent, | |
236 Transparent, Transparent, Transparent, ArabicNone, | |
237 ArabicNone, Zain, Kaph, Fe, | |
238 }; | |
239 | |
240 static ArabicGroup arabicGroup(unsigned short uc) | |
241 { | |
242 if (uc >= 0x0600 && uc < 0x750) | |
243 return (ArabicGroup) arabic_group[uc-0x600]; | |
244 else if (uc == 0x200d) | |
245 return Center; | |
246 else if (HB_GetUnicodeCharCategory(uc) == HB_Separator_Space) | |
247 return ArabicSpace; | |
248 else | |
249 return ArabicNone; | |
250 } | |
251 | |
252 | |
253 /* | |
254 Arabic shaping obeys a number of rules according to the joining classes (see
Unicode book, section on | |
255 arabic). | |
256 | |
257 Each unicode char has a joining class (right, dual (left&right), center (join
causing) or transparent). | |
258 transparent joining is not encoded in HB_UChar16::joining(), but applies to a
ll combining marks and format marks. | |
259 | |
260 Right join-causing: dual + center | |
261 Left join-causing: dual + right + center | |
262 | |
263 Rules are as follows (for a string already in visual order, as we have it her
e): | |
264 | |
265 R1 Transparent characters do not affect joining behaviour. | |
266 R2 A right joining character, that has a right join-causing char on the right
will get form XRight | |
267 (R3 A left joining character, that has a left join-causing char on the left w
ill get form XLeft) | |
268 Note: the above rule is meaningless, as there are no pure left joining charac
ters defined in Unicode | |
269 R4 A dual joining character, that has a left join-causing char on the left an
d a right join-causing char on | |
270 the right will get form XMedial | |
271 R5 A dual joining character, that has a right join causing char on the right
, and no left join causing char on the left | |
272 will get form XRight | |
273 R6 A dual joining character, that has a left join causing char on the left,
and no right join causing char on the right | |
274 will get form XLeft | |
275 R7 Otherwise the character will get form XIsolated | |
276 | |
277 Additionally we have to do the minimal ligature support for lam-alef ligature
s: | |
278 | |
279 L1 Transparent characters do not affect ligature behaviour. | |
280 L2 Any sequence of Alef(XRight) + Lam(XMedial) will form the ligature Alef.La
m(XLeft) | |
281 L3 Any sequence of Alef(XRight) + Lam(XLeft) will form the ligature Alef.Lam(
XIsolated) | |
282 | |
283 The state table below handles rules R1-R7. | |
284 */ | |
285 | |
286 typedef enum { | |
287 JNone, | |
288 JCausing, | |
289 JDual, | |
290 JRight, | |
291 JTransparent | |
292 } Joining; | |
293 | |
294 static const Joining joining_for_group[ArabicGroupsEnd] = { | |
295 /* NonJoining */ | |
296 JNone, /* ArabicNone */ | |
297 JNone, /* ArabicSpace */ | |
298 /* Transparent */ | |
299 JTransparent, /* Transparent */ | |
300 /* Causing */ | |
301 JCausing, /* Center */ | |
302 JCausing, /* Kashida */ | |
303 /* Dual */ | |
304 JDual, /* Beh */ | |
305 JDual, /* Noon */ | |
306 JDual, /* Yeh */ | |
307 JDual, /* Hah */ | |
308 JDual, /* Seen */ | |
309 JDual, /* Tah */ | |
310 JDual, /* Ain */ | |
311 /* Right */ | |
312 JRight, /* Alef */ | |
313 JRight, /* Waw */ | |
314 JRight, /* Dal */ | |
315 JRight, /* Reh */ | |
316 JRight /* HamzaOnHehGoal */ | |
317 }; | |
318 | |
319 | |
320 typedef struct { | |
321 ArabicShape form1; | |
322 ArabicShape form2; | |
323 } JoiningPair; | |
324 | |
325 static const JoiningPair joining_table[5][4] = | |
326 /* None, Causing, Dual, Right */ | |
327 { | |
328 { { XIsolated, XIsolated }, { XIsolated, XCausing }, { XIsolated, XInitial }
, { XIsolated, XIsolated } }, /* XIsolated */ | |
329 { { XFinal, XIsolated }, { XFinal, XCausing }, { XFinal, XInitial }, { XFina
l, XIsolated } }, /* XFinal */ | |
330 { { XIsolated, XIsolated }, { XInitial, XCausing }, { XInitial, XMedial }, {
XInitial, XFinal } }, /* XInitial */ | |
331 { { XFinal, XIsolated }, { XMedial, XCausing }, { XMedial, XMedial }, { XMed
ial, XFinal } }, /* XMedial */ | |
332 { { XIsolated, XIsolated }, { XIsolated, XCausing }, { XIsolated, XMedial },
{ XIsolated, XFinal } }, /* XCausing */ | |
333 }; | |
334 | |
335 | |
336 /* | |
337 According to http://www.microsoft.com/middleeast/Arabicdev/IE6/KBase.asp | |
338 | |
339 1. Find the priority of the connecting opportunities in each word | |
340 2. Add expansion at the highest priority connection opportunity | |
341 3. If more than one connection opportunity have the same highest value, | |
342 use the opportunity closest to the end of the word. | |
343 | |
344 Following is a chart that provides the priority for connection | |
345 opportunities and where expansion occurs. The character group names | |
346 are those in table 6.6 of the UNICODE 2.0 book. | |
347 | |
348 | |
349 PrioritY Glyph Condition
Kashida Location | |
350 | |
351 Arabic_Kashida User inserted Kashida The user entered a Kashida in a po
sition. After the user | |
352 (Shift+j or Shift+[E with hat]) Thus, it is the highest prior
ity to insert an inserted kashida | |
353 automatic kashida. | |
354 | |
355 Arabic_Seen Seen, Sad Connecting to the next character.
After the character. | |
356 (Initial or medial form). | |
357 | |
358 Arabic_HaaDal Teh Marbutah, Haa, Dal Connecting to previous character.
Before the final form | |
359
of these characters. | |
360 | |
361 Arabic_Alef Alef, Tah, Lam, Connecting to previous character.
Before the final form | |
362 Kaf and Gaf
of these characters. | |
363 | |
364 Arabic_BaRa Reh, Yeh Connected to medial Beh
Before preceding medial Baa | |
365 | |
366 Arabic_Waw Waw, Ain, Qaf, Feh Connecting to previous character.
Before the final form of | |
367
these characters. | |
368 | |
369 Arabic_Normal Other connecting Connecting to previous character.
Before the final form | |
370 characters
of these characters. | |
371 | |
372 | |
373 | |
374 This seems to imply that we have at most one kashida point per arabic word. | |
375 | |
376 */ | |
377 | |
378 static void getArabicProperties(const unsigned short *chars, int len, HB_ArabicP
roperties *properties) | |
379 { | |
380 /* qDebug("arabicSyriacOpenTypeShape: properties:"); */ | |
381 int lastPos = 0; | |
382 int lastGroup = ArabicNone; | |
383 int i = 0; | |
384 | |
385 ArabicGroup group = arabicGroup(chars[0]); | |
386 Joining j = joining_for_group[group]; | |
387 ArabicShape shape = joining_table[XIsolated][j].form2; | |
388 properties[0].justification = HB_NoJustification; | |
389 | |
390 for (i = 1; i < len; ++i) { | |
391 /* #### fix handling for spaces and punktuation */ | |
392 properties[i].justification = HB_NoJustification; | |
393 | |
394 group = arabicGroup(chars[i]); | |
395 j = joining_for_group[group]; | |
396 | |
397 if (j == JTransparent) { | |
398 properties[i].shape = XIsolated; | |
399 continue; | |
400 } | |
401 | |
402 properties[lastPos].shape = joining_table[shape][j].form1; | |
403 shape = joining_table[shape][j].form2; | |
404 | |
405 switch(lastGroup) { | |
406 case Seen: | |
407 if (properties[lastPos].shape == XInitial || properties[lastPos].sha
pe == XMedial) | |
408 properties[i-1].justification = HB_Arabic_Seen; | |
409 break; | |
410 case Hah: | |
411 if (properties[lastPos].shape == XFinal) | |
412 properties[lastPos-1].justification = HB_Arabic_HaaDal; | |
413 break; | |
414 case Alef: | |
415 if (properties[lastPos].shape == XFinal) | |
416 properties[lastPos-1].justification = HB_Arabic_Alef; | |
417 break; | |
418 case Ain: | |
419 if (properties[lastPos].shape == XFinal) | |
420 properties[lastPos-1].justification = HB_Arabic_Waw; | |
421 break; | |
422 case Noon: | |
423 if (properties[lastPos].shape == XFinal) | |
424 properties[lastPos-1].justification = HB_Arabic_Normal; | |
425 break; | |
426 case ArabicNone: | |
427 break; | |
428 | |
429 default: | |
430 assert(FALSE); | |
431 } | |
432 | |
433 lastGroup = ArabicNone; | |
434 | |
435 switch(group) { | |
436 case ArabicNone: | |
437 case Transparent: | |
438 /* ### Center should probably be treated as transparent when it comes to
justification. */ | |
439 case Center: | |
440 break; | |
441 case ArabicSpace: | |
442 properties[i].justification = HB_Arabic_Space; | |
443 break; | |
444 case Kashida: | |
445 properties[i].justification = HB_Arabic_Kashida; | |
446 break; | |
447 case Seen: | |
448 lastGroup = Seen; | |
449 break; | |
450 | |
451 case Hah: | |
452 case Dal: | |
453 lastGroup = Hah; | |
454 break; | |
455 | |
456 case Alef: | |
457 case Tah: | |
458 lastGroup = Alef; | |
459 break; | |
460 | |
461 case Yeh: | |
462 case Reh: | |
463 if (properties[lastPos].shape == XMedial && arabicGroup(chars[lastPo
s]) == Beh) | |
464 properties[lastPos-1].justification = HB_Arabic_BaRa; | |
465 break; | |
466 | |
467 case Ain: | |
468 case Waw: | |
469 lastGroup = Ain; | |
470 break; | |
471 | |
472 case Noon: | |
473 case Beh: | |
474 case HamzaOnHehGoal: | |
475 lastGroup = Noon; | |
476 break; | |
477 case ArabicGroupsEnd: | |
478 assert(FALSE); | |
479 } | |
480 | |
481 lastPos = i; | |
482 } | |
483 properties[lastPos].shape = joining_table[shape][JNone].form1; | |
484 | |
485 | |
486 /* | |
487 for (int i = 0; i < len; ++i) | |
488 qDebug("arabic properties(%d): uc=%x shape=%d, justification=%d", i, ch
ars[i], properties[i].shape, properties[i].justification); | |
489 */ | |
490 } | |
491 | |
492 static Joining getNkoJoining(unsigned short uc) | |
493 { | |
494 if (uc < 0x7ca) | |
495 return JNone; | |
496 if (uc <= 0x7ea) | |
497 return JDual; | |
498 if (uc <= 0x7f3) | |
499 return JTransparent; | |
500 if (uc <= 0x7f9) | |
501 return JNone; | |
502 if (uc == 0x7fa) | |
503 return JCausing; | |
504 return JNone; | |
505 } | |
506 | |
507 static void getNkoProperties(const unsigned short *chars, int len, HB_ArabicProp
erties *properties) | |
508 { | |
509 int lastPos = 0; | |
510 int i = 0; | |
511 | |
512 Joining j = getNkoJoining(chars[0]); | |
513 ArabicShape shape = joining_table[XIsolated][j].form2; | |
514 properties[0].justification = HB_NoJustification; | |
515 | |
516 for (i = 1; i < len; ++i) { | |
517 properties[i].justification = (HB_GetUnicodeCharCategory(chars[i]) == HB
_Separator_Space) ? | |
518 ArabicSpace : ArabicNone; | |
519 | |
520 j = getNkoJoining(chars[i]); | |
521 | |
522 if (j == JTransparent) { | |
523 properties[i].shape = XIsolated; | |
524 continue; | |
525 } | |
526 | |
527 properties[lastPos].shape = joining_table[shape][j].form1; | |
528 shape = joining_table[shape][j].form2; | |
529 | |
530 | |
531 lastPos = i; | |
532 } | |
533 properties[lastPos].shape = joining_table[shape][JNone].form1; | |
534 | |
535 | |
536 /* | |
537 for (int i = 0; i < len; ++i) | |
538 qDebug("nko properties(%d): uc=%x shape=%d, justification=%d", i, chars
[i], properties[i].shape, properties[i].justification); | |
539 */ | |
540 } | |
541 | |
542 /* | |
543 // The unicode to unicode shaping codec. | |
544 // does only presentation forms B at the moment, but that should be enough for | |
545 // simple display | |
546 */ | |
547 static const hb_uint16 arabicUnicodeMapping[256][2] = { | |
548 /* base of shaped forms, and number-1 of them (0 for non shaping, | |
549 1 for right binding and 3 for dual binding */ | |
550 | |
551 /* These are just the glyphs available in Unicode, | |
552 some characters are in R class, but have no glyphs in Unicode. */ | |
553 | |
554 { 0x0600, 0 }, /* 0x0600 */ | |
555 { 0x0601, 0 }, /* 0x0601 */ | |
556 { 0x0602, 0 }, /* 0x0602 */ | |
557 { 0x0603, 0 }, /* 0x0603 */ | |
558 { 0x0604, 0 }, /* 0x0604 */ | |
559 { 0x0605, 0 }, /* 0x0605 */ | |
560 { 0x0606, 0 }, /* 0x0606 */ | |
561 { 0x0607, 0 }, /* 0x0607 */ | |
562 { 0x0608, 0 }, /* 0x0608 */ | |
563 { 0x0609, 0 }, /* 0x0609 */ | |
564 { 0x060A, 0 }, /* 0x060A */ | |
565 { 0x060B, 0 }, /* 0x060B */ | |
566 { 0x060C, 0 }, /* 0x060C */ | |
567 { 0x060D, 0 }, /* 0x060D */ | |
568 { 0x060E, 0 }, /* 0x060E */ | |
569 { 0x060F, 0 }, /* 0x060F */ | |
570 | |
571 { 0x0610, 0 }, /* 0x0610 */ | |
572 { 0x0611, 0 }, /* 0x0611 */ | |
573 { 0x0612, 0 }, /* 0x0612 */ | |
574 { 0x0613, 0 }, /* 0x0613 */ | |
575 { 0x0614, 0 }, /* 0x0614 */ | |
576 { 0x0615, 0 }, /* 0x0615 */ | |
577 { 0x0616, 0 }, /* 0x0616 */ | |
578 { 0x0617, 0 }, /* 0x0617 */ | |
579 { 0x0618, 0 }, /* 0x0618 */ | |
580 { 0x0619, 0 }, /* 0x0619 */ | |
581 { 0x061A, 0 }, /* 0x061A */ | |
582 { 0x061B, 0 }, /* 0x061B */ | |
583 { 0x061C, 0 }, /* 0x061C */ | |
584 { 0x061D, 0 }, /* 0x061D */ | |
585 { 0x061E, 0 }, /* 0x061E */ | |
586 { 0x061F, 0 }, /* 0x061F */ | |
587 | |
588 { 0x0620, 0 }, /* 0x0620 */ | |
589 { 0xFE80, 0 }, /* 0x0621 HAMZA */ | |
590 { 0xFE81, 1 }, /* 0x0622 R ALEF WITH MADDA ABOVE */ | |
591 { 0xFE83, 1 }, /* 0x0623 R ALEF WITH HAMZA ABOVE */ | |
592 { 0xFE85, 1 }, /* 0x0624 R WAW WITH HAMZA ABOVE */ | |
593 { 0xFE87, 1 }, /* 0x0625 R ALEF WITH HAMZA BELOW */ | |
594 { 0xFE89, 3 }, /* 0x0626 D YEH WITH HAMZA ABOVE */ | |
595 { 0xFE8D, 1 }, /* 0x0627 R ALEF */ | |
596 { 0xFE8F, 3 }, /* 0x0628 D BEH */ | |
597 { 0xFE93, 1 }, /* 0x0629 R TEH MARBUTA */ | |
598 { 0xFE95, 3 }, /* 0x062A D TEH */ | |
599 { 0xFE99, 3 }, /* 0x062B D THEH */ | |
600 { 0xFE9D, 3 }, /* 0x062C D JEEM */ | |
601 { 0xFEA1, 3 }, /* 0x062D D HAH */ | |
602 { 0xFEA5, 3 }, /* 0x062E D KHAH */ | |
603 { 0xFEA9, 1 }, /* 0x062F R DAL */ | |
604 | |
605 { 0xFEAB, 1 }, /* 0x0630 R THAL */ | |
606 { 0xFEAD, 1 }, /* 0x0631 R REH */ | |
607 { 0xFEAF, 1 }, /* 0x0632 R ZAIN */ | |
608 { 0xFEB1, 3 }, /* 0x0633 D SEEN */ | |
609 { 0xFEB5, 3 }, /* 0x0634 D SHEEN */ | |
610 { 0xFEB9, 3 }, /* 0x0635 D SAD */ | |
611 { 0xFEBD, 3 }, /* 0x0636 D DAD */ | |
612 { 0xFEC1, 3 }, /* 0x0637 D TAH */ | |
613 { 0xFEC5, 3 }, /* 0x0638 D ZAH */ | |
614 { 0xFEC9, 3 }, /* 0x0639 D AIN */ | |
615 { 0xFECD, 3 }, /* 0x063A D GHAIN */ | |
616 { 0x063B, 0 }, /* 0x063B */ | |
617 { 0x063C, 0 }, /* 0x063C */ | |
618 { 0x063D, 0 }, /* 0x063D */ | |
619 { 0x063E, 0 }, /* 0x063E */ | |
620 { 0x063F, 0 }, /* 0x063F */ | |
621 | |
622 { 0x0640, 0 }, /* 0x0640 C TATWEEL // ### Join Causing, only one gl
yph */ | |
623 { 0xFED1, 3 }, /* 0x0641 D FEH */ | |
624 { 0xFED5, 3 }, /* 0x0642 D QAF */ | |
625 { 0xFED9, 3 }, /* 0x0643 D KAF */ | |
626 { 0xFEDD, 3 }, /* 0x0644 D LAM */ | |
627 { 0xFEE1, 3 }, /* 0x0645 D MEEM */ | |
628 { 0xFEE5, 3 }, /* 0x0646 D NOON */ | |
629 { 0xFEE9, 3 }, /* 0x0647 D HEH */ | |
630 { 0xFEED, 1 }, /* 0x0648 R WAW */ | |
631 { 0x0649, 3 }, /* 0x0649 ALEF MAKSURA // ### Dual, glyphs not con
secutive, handle in code. */ | |
632 { 0xFEF1, 3 }, /* 0x064A D YEH */ | |
633 { 0x064B, 0 }, /* 0x064B */ | |
634 { 0x064C, 0 }, /* 0x064C */ | |
635 { 0x064D, 0 }, /* 0x064D */ | |
636 { 0x064E, 0 }, /* 0x064E */ | |
637 { 0x064F, 0 }, /* 0x064F */ | |
638 | |
639 { 0x0650, 0 }, /* 0x0650 */ | |
640 { 0x0651, 0 }, /* 0x0651 */ | |
641 { 0x0652, 0 }, /* 0x0652 */ | |
642 { 0x0653, 0 }, /* 0x0653 */ | |
643 { 0x0654, 0 }, /* 0x0654 */ | |
644 { 0x0655, 0 }, /* 0x0655 */ | |
645 { 0x0656, 0 }, /* 0x0656 */ | |
646 { 0x0657, 0 }, /* 0x0657 */ | |
647 { 0x0658, 0 }, /* 0x0658 */ | |
648 { 0x0659, 0 }, /* 0x0659 */ | |
649 { 0x065A, 0 }, /* 0x065A */ | |
650 { 0x065B, 0 }, /* 0x065B */ | |
651 { 0x065C, 0 }, /* 0x065C */ | |
652 { 0x065D, 0 }, /* 0x065D */ | |
653 { 0x065E, 0 }, /* 0x065E */ | |
654 { 0x065F, 0 }, /* 0x065F */ | |
655 | |
656 { 0x0660, 0 }, /* 0x0660 */ | |
657 { 0x0661, 0 }, /* 0x0661 */ | |
658 { 0x0662, 0 }, /* 0x0662 */ | |
659 { 0x0663, 0 }, /* 0x0663 */ | |
660 { 0x0664, 0 }, /* 0x0664 */ | |
661 { 0x0665, 0 }, /* 0x0665 */ | |
662 { 0x0666, 0 }, /* 0x0666 */ | |
663 { 0x0667, 0 }, /* 0x0667 */ | |
664 { 0x0668, 0 }, /* 0x0668 */ | |
665 { 0x0669, 0 }, /* 0x0669 */ | |
666 { 0x066A, 0 }, /* 0x066A */ | |
667 { 0x066B, 0 }, /* 0x066B */ | |
668 { 0x066C, 0 }, /* 0x066C */ | |
669 { 0x066D, 0 }, /* 0x066D */ | |
670 { 0x066E, 0 }, /* 0x066E */ | |
671 { 0x066F, 0 }, /* 0x066F */ | |
672 | |
673 { 0x0670, 0 }, /* 0x0670 */ | |
674 { 0xFB50, 1 }, /* 0x0671 R ALEF WASLA */ | |
675 { 0x0672, 0 }, /* 0x0672 */ | |
676 { 0x0673, 0 }, /* 0x0673 */ | |
677 { 0x0674, 0 }, /* 0x0674 */ | |
678 { 0x0675, 0 }, /* 0x0675 */ | |
679 { 0x0676, 0 }, /* 0x0676 */ | |
680 { 0x0677, 0 }, /* 0x0677 */ | |
681 { 0x0678, 0 }, /* 0x0678 */ | |
682 { 0xFB66, 3 }, /* 0x0679 D TTEH */ | |
683 { 0xFB5E, 3 }, /* 0x067A D TTEHEH */ | |
684 { 0xFB52, 3 }, /* 0x067B D BEEH */ | |
685 { 0x067C, 0 }, /* 0x067C */ | |
686 { 0x067D, 0 }, /* 0x067D */ | |
687 { 0xFB56, 3 }, /* 0x067E D PEH */ | |
688 { 0xFB62, 3 }, /* 0x067F D TEHEH */ | |
689 | |
690 { 0xFB5A, 3 }, /* 0x0680 D BEHEH */ | |
691 { 0x0681, 0 }, /* 0x0681 */ | |
692 { 0x0682, 0 }, /* 0x0682 */ | |
693 { 0xFB76, 3 }, /* 0x0683 D NYEH */ | |
694 { 0xFB72, 3 }, /* 0x0684 D DYEH */ | |
695 { 0x0685, 0 }, /* 0x0685 */ | |
696 { 0xFB7A, 3 }, /* 0x0686 D TCHEH */ | |
697 { 0xFB7E, 3 }, /* 0x0687 D TCHEHEH */ | |
698 { 0xFB88, 1 }, /* 0x0688 R DDAL */ | |
699 { 0x0689, 0 }, /* 0x0689 */ | |
700 { 0x068A, 0 }, /* 0x068A */ | |
701 { 0x068B, 0 }, /* 0x068B */ | |
702 { 0xFB84, 1 }, /* 0x068C R DAHAL */ | |
703 { 0xFB82, 1 }, /* 0x068D R DDAHAL */ | |
704 { 0xFB86, 1 }, /* 0x068E R DUL */ | |
705 { 0x068F, 0 }, /* 0x068F */ | |
706 | |
707 { 0x0690, 0 }, /* 0x0690 */ | |
708 { 0xFB8C, 1 }, /* 0x0691 R RREH */ | |
709 { 0x0692, 0 }, /* 0x0692 */ | |
710 { 0x0693, 0 }, /* 0x0693 */ | |
711 { 0x0694, 0 }, /* 0x0694 */ | |
712 { 0x0695, 0 }, /* 0x0695 */ | |
713 { 0x0696, 0 }, /* 0x0696 */ | |
714 { 0x0697, 0 }, /* 0x0697 */ | |
715 { 0xFB8A, 1 }, /* 0x0698 R JEH */ | |
716 { 0x0699, 0 }, /* 0x0699 */ | |
717 { 0x069A, 0 }, /* 0x069A */ | |
718 { 0x069B, 0 }, /* 0x069B */ | |
719 { 0x069C, 0 }, /* 0x069C */ | |
720 { 0x069D, 0 }, /* 0x069D */ | |
721 { 0x069E, 0 }, /* 0x069E */ | |
722 { 0x069F, 0 }, /* 0x069F */ | |
723 | |
724 { 0x06A0, 0 }, /* 0x06A0 */ | |
725 { 0x06A1, 0 }, /* 0x06A1 */ | |
726 { 0x06A2, 0 }, /* 0x06A2 */ | |
727 { 0x06A3, 0 }, /* 0x06A3 */ | |
728 { 0xFB6A, 3 }, /* 0x06A4 D VEH */ | |
729 { 0x06A5, 0 }, /* 0x06A5 */ | |
730 { 0xFB6E, 3 }, /* 0x06A6 D PEHEH */ | |
731 { 0x06A7, 0 }, /* 0x06A7 */ | |
732 { 0x06A8, 0 }, /* 0x06A8 */ | |
733 { 0xFB8E, 3 }, /* 0x06A9 D KEHEH */ | |
734 { 0x06AA, 0 }, /* 0x06AA */ | |
735 { 0x06AB, 0 }, /* 0x06AB */ | |
736 { 0x06AC, 0 }, /* 0x06AC */ | |
737 { 0xFBD3, 3 }, /* 0x06AD D NG */ | |
738 { 0x06AE, 0 }, /* 0x06AE */ | |
739 { 0xFB92, 3 }, /* 0x06AF D GAF */ | |
740 | |
741 { 0x06B0, 0 }, /* 0x06B0 */ | |
742 { 0xFB9A, 3 }, /* 0x06B1 D NGOEH */ | |
743 { 0x06B2, 0 }, /* 0x06B2 */ | |
744 { 0xFB96, 3 }, /* 0x06B3 D GUEH */ | |
745 { 0x06B4, 0 }, /* 0x06B4 */ | |
746 { 0x06B5, 0 }, /* 0x06B5 */ | |
747 { 0x06B6, 0 }, /* 0x06B6 */ | |
748 { 0x06B7, 0 }, /* 0x06B7 */ | |
749 { 0x06B8, 0 }, /* 0x06B8 */ | |
750 { 0x06B9, 0 }, /* 0x06B9 */ | |
751 { 0xFB9E, 1 }, /* 0x06BA R NOON GHUNNA */ | |
752 { 0xFBA0, 3 }, /* 0x06BB D RNOON */ | |
753 { 0x06BC, 0 }, /* 0x06BC */ | |
754 { 0x06BD, 0 }, /* 0x06BD */ | |
755 { 0xFBAA, 3 }, /* 0x06BE D HEH DOACHASHMEE */ | |
756 { 0x06BF, 0 }, /* 0x06BF */ | |
757 | |
758 { 0xFBA4, 1 }, /* 0x06C0 R HEH WITH YEH ABOVE */ | |
759 { 0xFBA6, 3 }, /* 0x06C1 D HEH GOAL */ | |
760 { 0x06C2, 0 }, /* 0x06C2 */ | |
761 { 0x06C3, 0 }, /* 0x06C3 */ | |
762 { 0x06C4, 0 }, /* 0x06C4 */ | |
763 { 0xFBE0, 1 }, /* 0x06C5 R KIRGHIZ OE */ | |
764 { 0xFBD9, 1 }, /* 0x06C6 R OE */ | |
765 { 0xFBD7, 1 }, /* 0x06C7 R U */ | |
766 { 0xFBDB, 1 }, /* 0x06C8 R YU */ | |
767 { 0xFBE2, 1 }, /* 0x06C9 R KIRGHIZ YU */ | |
768 { 0x06CA, 0 }, /* 0x06CA */ | |
769 { 0xFBDE, 1 }, /* 0x06CB R VE */ | |
770 { 0xFBFC, 3 }, /* 0x06CC D FARSI YEH */ | |
771 { 0x06CD, 0 }, /* 0x06CD */ | |
772 { 0x06CE, 0 }, /* 0x06CE */ | |
773 { 0x06CF, 0 }, /* 0x06CF */ | |
774 | |
775 { 0xFBE4, 3 }, /* 0x06D0 D E */ | |
776 { 0x06D1, 0 }, /* 0x06D1 */ | |
777 { 0xFBAE, 1 }, /* 0x06D2 R YEH BARREE */ | |
778 { 0xFBB0, 1 }, /* 0x06D3 R YEH BARREE WITH HAMZA ABOVE */ | |
779 { 0x06D4, 0 }, /* 0x06D4 */ | |
780 { 0x06D5, 0 }, /* 0x06D5 */ | |
781 { 0x06D6, 0 }, /* 0x06D6 */ | |
782 { 0x06D7, 0 }, /* 0x06D7 */ | |
783 { 0x06D8, 0 }, /* 0x06D8 */ | |
784 { 0x06D9, 0 }, /* 0x06D9 */ | |
785 { 0x06DA, 0 }, /* 0x06DA */ | |
786 { 0x06DB, 0 }, /* 0x06DB */ | |
787 { 0x06DC, 0 }, /* 0x06DC */ | |
788 { 0x06DD, 0 }, /* 0x06DD */ | |
789 { 0x06DE, 0 }, /* 0x06DE */ | |
790 { 0x06DF, 0 }, /* 0x06DF */ | |
791 | |
792 { 0x06E0, 0 }, /* 0x06E0 */ | |
793 { 0x06E1, 0 }, /* 0x06E1 */ | |
794 { 0x06E2, 0 }, /* 0x06E2 */ | |
795 { 0x06E3, 0 }, /* 0x06E3 */ | |
796 { 0x06E4, 0 }, /* 0x06E4 */ | |
797 { 0x06E5, 0 }, /* 0x06E5 */ | |
798 { 0x06E6, 0 }, /* 0x06E6 */ | |
799 { 0x06E7, 0 }, /* 0x06E7 */ | |
800 { 0x06E8, 0 }, /* 0x06E8 */ | |
801 { 0x06E9, 0 }, /* 0x06E9 */ | |
802 { 0x06EA, 0 }, /* 0x06EA */ | |
803 { 0x06EB, 0 }, /* 0x06EB */ | |
804 { 0x06EC, 0 }, /* 0x06EC */ | |
805 { 0x06ED, 0 }, /* 0x06ED */ | |
806 { 0x06EE, 0 }, /* 0x06EE */ | |
807 { 0x06EF, 0 }, /* 0x06EF */ | |
808 | |
809 { 0x06F0, 0 }, /* 0x06F0 */ | |
810 { 0x06F1, 0 }, /* 0x06F1 */ | |
811 { 0x06F2, 0 }, /* 0x06F2 */ | |
812 { 0x06F3, 0 }, /* 0x06F3 */ | |
813 { 0x06F4, 0 }, /* 0x06F4 */ | |
814 { 0x06F5, 0 }, /* 0x06F5 */ | |
815 { 0x06F6, 0 }, /* 0x06F6 */ | |
816 { 0x06F7, 0 }, /* 0x06F7 */ | |
817 { 0x06F8, 0 }, /* 0x06F8 */ | |
818 { 0x06F9, 0 }, /* 0x06F9 */ | |
819 { 0x06FA, 0 }, /* 0x06FA */ | |
820 { 0x06FB, 0 }, /* 0x06FB */ | |
821 { 0x06FC, 0 }, /* 0x06FC */ | |
822 { 0x06FD, 0 }, /* 0x06FD */ | |
823 { 0x06FE, 0 }, /* 0x06FE */ | |
824 { 0x06FF, 0 } /* 0x06FF */ | |
825 }; | |
826 | |
827 /* the arabicUnicodeMapping does not work for U+0649 ALEF MAKSURA, this table do
es */ | |
828 static const hb_uint16 alefMaksura[4] = {0xFEEF, 0xFEF0, 0xFBE8, 0xFBE9}; | |
829 | |
830 /* | |
831 // this is a bit tricky. Alef always binds to the right, so the second parameter
descibing the shape | |
832 // of the lam can be either initial of medial. So initial maps to the isolated f
orm of the ligature, | |
833 // medial to the final form | |
834 */ | |
835 static const hb_uint16 arabicUnicodeLamAlefMapping[6][4] = { | |
836 { 0xfffd, 0xfffd, 0xfef5, 0xfef6 }, /* 0x622 R Alef with Madda
above */ | |
837 { 0xfffd, 0xfffd, 0xfef7, 0xfef8 }, /* 0x623 R Alef with Hamza
above */ | |
838 { 0xfffd, 0xfffd, 0xfffd, 0xfffd }, /* 0x624 // Just to fill the tabl
e ;-) */ | |
839 { 0xfffd, 0xfffd, 0xfef9, 0xfefa }, /* 0x625 R Alef with Hamza
below */ | |
840 { 0xfffd, 0xfffd, 0xfffd, 0xfffd }, /* 0x626 // Just to fill the tabl
e ;-) */ | |
841 { 0xfffd, 0xfffd, 0xfefb, 0xfefc } /* 0x627 R Alef */ | |
842 }; | |
843 | |
844 static int getShape(hb_uint8 cell, int shape) | |
845 { | |
846 /* the arabicUnicodeMapping does not work for U+0649 ALEF MAKSURA, handle th
is here */ | |
847 int ch = (cell != 0x49) | |
848 ? (shape ? arabicUnicodeMapping[cell][0] + shape : 0x600+cell) | |
849 : alefMaksura[shape] ; | |
850 return ch; | |
851 } | |
852 | |
853 | |
854 /* | |
855 Two small helper functions for arabic shaping. | |
856 */ | |
857 static HB_UChar16 prevChar(const HB_UChar16 *str, int pos) | |
858 { | |
859 /*qDebug("leftChar: pos=%d", pos); */ | |
860 const HB_UChar16 *ch = str + pos - 1; | |
861 pos--; | |
862 while(pos > -1) { | |
863 if(HB_GetUnicodeCharCategory(*ch) != HB_Mark_NonSpacing) | |
864 return *ch; | |
865 pos--; | |
866 ch--; | |
867 } | |
868 return ReplacementCharacter; | |
869 } | |
870 | |
871 static HB_UChar16 nextChar(const HB_UChar16 *str, hb_uint32 len, hb_uint32 pos) | |
872 { | |
873 const HB_UChar16 *ch = str + pos + 1; | |
874 pos++; | |
875 while(pos < len) { | |
876 /*qDebug("rightChar: %d isLetter=%d, joining=%d", pos, ch.isLetter(), ch
.joining()); */ | |
877 if(HB_GetUnicodeCharCategory(*ch) != HB_Mark_NonSpacing) | |
878 return *ch; | |
879 /* assume it's a transparent char, this might not be 100% correct */ | |
880 pos++; | |
881 ch++; | |
882 } | |
883 return ReplacementCharacter; | |
884 } | |
885 | |
886 static void shapedString(const HB_UChar16 *uc, hb_uint32 stringLength, hb_uint32
from, hb_uint32 len, HB_UChar16 *shapeBuffer, int *shapedLength, | |
887 HB_Bool reverse, HB_GlyphAttributes *attributes, unsign
ed short *logClusters) | |
888 { | |
889 HB_ArabicProperties *properties; | |
890 hb_int32 f = from; | |
891 hb_uint32 l = len; | |
892 const HB_UChar16 *ch; | |
893 HB_UChar16 *data; | |
894 int clusterStart; | |
895 hb_uint32 i; | |
896 HB_STACKARRAY(HB_ArabicProperties, props, len + 2); | |
897 properties = props; | |
898 | |
899 assert(stringLength >= from + len); | |
900 | |
901 if(len == 0) { | |
902 *shapedLength = 0; | |
903 return; | |
904 } | |
905 | |
906 if (from > 0) { | |
907 --f; | |
908 ++l; | |
909 ++properties; | |
910 } | |
911 if (f + l < stringLength) | |
912 ++l; | |
913 getArabicProperties(uc+f, l, props); | |
914 | |
915 ch = uc + from; | |
916 data = shapeBuffer; | |
917 clusterStart = 0; | |
918 | |
919 for (i = 0; i < len; i++) { | |
920 hb_uint8 r = *ch >> 8; | |
921 int gpos = data - shapeBuffer; | |
922 | |
923 if (r != 0x06) { | |
924 if (r == 0x20) { | |
925 if (*ch == 0x200c || *ch == 0x200d) | |
926 /* remove ZWJ and ZWNJ */ | |
927 goto skip; | |
928 } | |
929 if (reverse) | |
930 *data = HB_GetMirroredChar(*ch); | |
931 else | |
932 *data = *ch; | |
933 } else { | |
934 hb_uint8 c = *ch & 0xff; | |
935 int pos = i + from; | |
936 int shape = properties[i].shape; | |
937 /* qDebug("mapping U+%x to shape %d glyph=0x%x", ch->unicode(), shape
, getShape(c, shape)); */ | |
938 /* take care of lam-alef ligatures (lam right of alef) */ | |
939 hb_uint16 map; | |
940 switch (c) { | |
941 case 0x44: { /* lam */ | |
942 const HB_UChar16 pch = nextChar(uc, stringLength, pos); | |
943 if ((pch >> 8) == 0x06) { | |
944 switch (pch & 0xff) { | |
945 case 0x22: | |
946 case 0x23: | |
947 case 0x25: | |
948 case 0x27: | |
949 /* qDebug(" lam of lam-alef ligature"); */ | |
950 map = arabicUnicodeLamAlefMapping[(pch & 0xff) -
0x22][shape]; | |
951 goto next; | |
952 default: | |
953 break; | |
954 } | |
955 } | |
956 break; | |
957 } | |
958 case 0x22: /* alef with madda */ | |
959 case 0x23: /* alef with hamza above */ | |
960 case 0x25: /* alef with hamza below */ | |
961 case 0x27: /* alef */ | |
962 if (prevChar(uc, pos) == 0x0644) { | |
963 /* have a lam alef ligature */ | |
964 /*qDebug(" alef of lam-alef ligature"); */ | |
965 goto skip; | |
966 } | |
967 default: | |
968 break; | |
969 } | |
970 map = getShape(c, shape); | |
971 next: | |
972 *data = map; | |
973 } | |
974 /* ##### Fixme */ | |
975 /*glyphs[gpos].attributes.zeroWidth = zeroWidth; */ | |
976 if (HB_GetUnicodeCharCategory(*ch) == HB_Mark_NonSpacing) { | |
977 attributes[gpos].mark = TRUE; | |
978 /* qDebug("glyph %d (char %d) is mark!", gpos, i); */ | |
979 } else { | |
980 attributes[gpos].mark = FALSE; | |
981 clusterStart = data - shapeBuffer; | |
982 } | |
983 attributes[gpos].clusterStart = !attributes[gpos].mark; | |
984 attributes[gpos].combiningClass = HB_GetUnicodeCharCombiningClass(*ch); | |
985 attributes[gpos].justification = properties[i].justification; | |
986 /* qDebug("data[%d] = %x (from %x)", gpos, (uint)data->unicode(), ch->un
icode());*/ | |
987 data++; | |
988 skip: | |
989 ch++; | |
990 logClusters[i] = clusterStart; | |
991 } | |
992 *shapedLength = data - shapeBuffer; | |
993 | |
994 HB_FREE_STACKARRAY(props); | |
995 } | |
996 | |
997 #ifndef NO_OPENTYPE | |
998 | |
999 static const HB_OpenTypeFeature arabic_features[] = { | |
1000 { HB_MAKE_TAG('c', 'c', 'm', 'p'), CcmpProperty }, | |
1001 { HB_MAKE_TAG('i', 's', 'o', 'l'), IsolProperty }, | |
1002 { HB_MAKE_TAG('f', 'i', 'n', 'a'), FinaProperty }, | |
1003 { HB_MAKE_TAG('m', 'e', 'd', 'i'), MediProperty }, | |
1004 { HB_MAKE_TAG('i', 'n', 'i', 't'), InitProperty }, | |
1005 { HB_MAKE_TAG('r', 'l', 'i', 'g'), RligProperty }, | |
1006 { HB_MAKE_TAG('c', 'a', 'l', 't'), CaltProperty }, | |
1007 { HB_MAKE_TAG('l', 'i', 'g', 'a'), LigaProperty }, | |
1008 { HB_MAKE_TAG('d', 'l', 'i', 'g'), DligProperty }, | |
1009 { HB_MAKE_TAG('c', 's', 'w', 'h'), CswhProperty }, | |
1010 /* mset is used in old Win95 fonts that don't have a 'mark' positioning tabl
e. */ | |
1011 { HB_MAKE_TAG('m', 's', 'e', 't'), MsetProperty }, | |
1012 {0, 0} | |
1013 }; | |
1014 | |
1015 static const HB_OpenTypeFeature syriac_features[] = { | |
1016 { HB_MAKE_TAG('c', 'c', 'm', 'p'), CcmpProperty }, | |
1017 { HB_MAKE_TAG('i', 's', 'o', 'l'), IsolProperty }, | |
1018 { HB_MAKE_TAG('f', 'i', 'n', 'a'), FinaProperty }, | |
1019 { HB_MAKE_TAG('f', 'i', 'n', '2'), FinaProperty }, | |
1020 { HB_MAKE_TAG('f', 'i', 'n', '3'), FinaProperty }, | |
1021 { HB_MAKE_TAG('m', 'e', 'd', 'i'), MediProperty }, | |
1022 { HB_MAKE_TAG('m', 'e', 'd', '2'), MediProperty }, | |
1023 { HB_MAKE_TAG('i', 'n', 'i', 't'), InitProperty }, | |
1024 { HB_MAKE_TAG('r', 'l', 'i', 'g'), RligProperty }, | |
1025 { HB_MAKE_TAG('c', 'a', 'l', 't'), CaltProperty }, | |
1026 { HB_MAKE_TAG('l', 'i', 'g', 'a'), LigaProperty }, | |
1027 { HB_MAKE_TAG('d', 'l', 'i', 'g'), DligProperty }, | |
1028 {0, 0} | |
1029 }; | |
1030 | |
1031 static HB_Bool arabicSyriacOpenTypeShape(HB_ShaperItem *item, HB_Bool *ot_ok) | |
1032 { | |
1033 const HB_UChar16 *uc; | |
1034 const int nglyphs = item->num_glyphs; | |
1035 hb_int32 f; | |
1036 hb_uint32 l; | |
1037 HB_ArabicProperties *properties; | |
1038 HB_DECLARE_STACKARRAY(HB_ArabicProperties, props) | |
1039 HB_DECLARE_STACKARRAY(hb_uint32, apply) | |
1040 HB_Bool shaped; | |
1041 int i = 0; | |
1042 | |
1043 *ot_ok = TRUE; | |
1044 | |
1045 if (!HB_ConvertStringToGlyphIndices(item)) | |
1046 return FALSE; | |
1047 HB_HeuristicSetGlyphAttributes(item); | |
1048 | |
1049 HB_INIT_STACKARRAY(HB_ArabicProperties, props, item->item.length + 2); | |
1050 HB_INIT_STACKARRAY(hb_uint32, apply, item->num_glyphs); | |
1051 | |
1052 uc = item->string + item->item.pos; | |
1053 | |
1054 properties = props; | |
1055 f = 0; | |
1056 l = item->item.length; | |
1057 if (item->item.pos > 0) { | |
1058 --f; | |
1059 ++l; | |
1060 ++properties; | |
1061 } | |
1062 if (f + l + item->item.pos < item->stringLength) { | |
1063 ++l; | |
1064 } | |
1065 if (item->item.script == HB_Script_Nko) | |
1066 getNkoProperties(uc+f, l, props); | |
1067 else | |
1068 getArabicProperties(uc+f, l, props); | |
1069 | |
1070 for (i = 0; i < (int)item->num_glyphs; i++) { | |
1071 apply[i] = 0; | |
1072 | |
1073 if (properties[i].shape == XIsolated) | |
1074 apply[i] |= MediProperty|FinaProperty|InitProperty; | |
1075 else if (properties[i].shape == XMedial) | |
1076 apply[i] |= IsolProperty|FinaProperty|InitProperty; | |
1077 else if (properties[i].shape == XFinal) | |
1078 apply[i] |= IsolProperty|MediProperty|InitProperty; | |
1079 else if (properties[i].shape == XInitial) | |
1080 apply[i] |= IsolProperty|MediProperty|FinaProperty; | |
1081 | |
1082 item->attributes[i].justification = properties[i].justification; | |
1083 } | |
1084 | |
1085 HB_FREE_STACKARRAY(props); | |
1086 | |
1087 shaped = HB_OpenTypeShape(item, apply); | |
1088 | |
1089 HB_FREE_STACKARRAY(apply); | |
1090 | |
1091 if (!shaped) { | |
1092 *ot_ok = FALSE; | |
1093 return FALSE; | |
1094 } | |
1095 return HB_OpenTypePosition(item, nglyphs, /*doLogClusters*/TRUE); | |
1096 } | |
1097 | |
1098 #endif | |
1099 | |
1100 /* #### stil missing: identify invalid character combinations */ | |
1101 HB_Bool HB_ArabicShape(HB_ShaperItem *item) | |
1102 { | |
1103 int slen; | |
1104 HB_Bool haveGlyphs; | |
1105 HB_STACKARRAY(HB_UChar16, shapedChars, item->item.length); | |
1106 | |
1107 assert(item->item.script == HB_Script_Arabic || item->item.script == HB_Scri
pt_Syriac | |
1108 || item->item.script == HB_Script_Nko); | |
1109 | |
1110 item->shaperFlags |= HB_ShaperFlag_ForceMarksToZeroWidth; | |
1111 #ifndef NO_OPENTYPE | |
1112 | |
1113 if (HB_SelectScript(item, item->item.script == HB_Script_Arabic ? arabic_fea
tures : syriac_features)) { | |
1114 HB_Bool ot_ok; | |
1115 if (arabicSyriacOpenTypeShape(item, &ot_ok)) | |
1116 return TRUE; | |
1117 if (ot_ok) | |
1118 return FALSE; | |
1119 /* fall through to the non OT code*/ | |
1120 } | |
1121 #endif | |
1122 | |
1123 if (item->item.script != HB_Script_Arabic) | |
1124 return HB_BasicShape(item); | |
1125 | |
1126 shapedString(item->string, item->stringLength, item->item.pos, item->item.le
ngth, shapedChars, &slen, | |
1127 item->item.bidiLevel % 2, | |
1128 item->attributes, item->log_clusters); | |
1129 | |
1130 haveGlyphs = item->font->klass | |
1131 ->convertStringToGlyphIndices(item->font, | |
1132 shapedChars, slen, | |
1133 item->glyphs, &item->num_glyphs, | |
1134 item->item.bidiLevel % 2); | |
1135 | |
1136 HB_FREE_STACKARRAY(shapedChars); | |
1137 | |
1138 if (!haveGlyphs) | |
1139 return FALSE; | |
1140 | |
1141 HB_HeuristicPosition(item); | |
1142 return TRUE; | |
1143 } | |
1144 | |
1145 | |
OLD | NEW |