|
1 /* |
|
2 * |
|
3 * (C) Copyright IBM Corp. 1998-2004 - All Rights Reserved |
|
4 * |
|
5 */ |
|
6 |
|
7 #include "LETypes.h" |
|
8 #include "LEGlyphFilter.h" |
|
9 #include "OpenTypeTables.h" |
|
10 #include "LEGlyphStorage.h" |
|
11 #include "ThaiShaping.h" |
|
12 |
|
13 U_NAMESPACE_BEGIN |
|
14 |
|
// Code points referenced by the shaping routines in this file,
// listed in ascending code point order.
enum {
    CH_SPACE         = 0x0020,

    // Consonants bounding the range handled by noDescenderCOD()
    CH_YO_YING       = 0x0E0D,
    CH_THO_THAN      = 0x0E10,

    // Vowels bounding the range handled by leftAboveVowel(),
    // plus the SARA AA / SARA AM pair used when decomposing SARA AM
    CH_MAI_HANAKAT   = 0x0E31,
    CH_SARA_AA       = 0x0E32,
    CH_SARA_AM       = 0x0E33,
    CH_SARA_UEE      = 0x0E37,

    // Vowels bounding the range handled by lowerBelowVowel()
    CH_SARA_U        = 0x0E38,
    CH_PHINTHU       = 0x0E3A,

    // Marks bounding the range handled by the *Tone() functions
    CH_MAITAIKHU     = 0x0E47,
    CH_NIKHAHIT      = 0x0E4D,

    CH_YAMAKKAN      = 0x0E4E,
    CH_DOTTED_CIRCLE = 0x25CC
};
|
30 |
|
31 le_uint8 ThaiShaping::getCharClass(LEUnicode ch) |
|
32 { |
|
33 le_uint8 charClass = NON; |
|
34 |
|
35 if (ch >= 0x0E00 && ch <= 0x0E5B) { |
|
36 charClass = classTable[ch - 0x0E00]; |
|
37 } |
|
38 |
|
39 return charClass; |
|
40 } |
|
41 |
|
42 |
|
43 LEUnicode ThaiShaping::leftAboveVowel(LEUnicode vowel, le_uint8 glyphSet) |
|
44 { |
|
45 static const LEUnicode leftAboveVowels[][7] = { |
|
46 {0x0E61, 0x0E32, 0x0E33, 0x0E64, 0x0E65, 0x0E66, 0x0E67}, |
|
47 {0xF710, 0x0E32, 0x0E33, 0xF701, 0xF702, 0xF703, 0xF704}, |
|
48 {0xF884, 0x0E32, 0x0E33, 0xF885, 0xF886, 0xF887, 0xF788}, |
|
49 {0x0E31, 0x0E32, 0x0E33, 0x0E34, 0x0E35, 0x0E36, 0x0E37} |
|
50 }; |
|
51 |
|
52 if (vowel >= CH_MAI_HANAKAT && vowel <= CH_SARA_UEE) { |
|
53 return leftAboveVowels[glyphSet][vowel - CH_MAI_HANAKAT]; |
|
54 } |
|
55 |
|
56 if (vowel == CH_YAMAKKAN && glyphSet == 0) { |
|
57 return 0x0E7E; |
|
58 } |
|
59 |
|
60 return vowel; |
|
61 } |
|
62 |
|
63 LEUnicode ThaiShaping::lowerRightTone(LEUnicode tone, le_uint8 glyphSet) |
|
64 { |
|
65 static const LEUnicode lowerRightTones[][7] = { |
|
66 {0x0E68, 0x0E69, 0x0E6A, 0x0E6B, 0x0E6C, 0x0E6D, 0x0E6E}, |
|
67 {0x0E47, 0xF70A, 0xF70B, 0xF70C, 0xF70D, 0xF70E, 0x0E4D}, |
|
68 {0x0E47, 0xF88B, 0xF88E, 0xF891, 0xF894, 0xF897, 0x0E4D}, |
|
69 {0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D} |
|
70 }; |
|
71 |
|
72 if (tone >= CH_MAITAIKHU && tone <= CH_NIKHAHIT) { |
|
73 return lowerRightTones[glyphSet][tone - CH_MAITAIKHU]; |
|
74 } |
|
75 |
|
76 return tone; |
|
77 } |
|
78 |
|
79 LEUnicode ThaiShaping::lowerLeftTone(LEUnicode tone, le_uint8 glyphSet) |
|
80 { |
|
81 static const LEUnicode lowerLeftTones[][7] = { |
|
82 {0x0E76, 0x0E77, 0x0E78, 0x0E79, 0x0E7A, 0x0E7B, 0x0E7C}, |
|
83 {0xF712, 0xF705, 0xF706, 0xF707, 0xF708, 0xF709, 0xF711}, |
|
84 {0xF889, 0xF88C, 0xF88F, 0xF892, 0xF895, 0xF898, 0xF899}, |
|
85 {0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D} |
|
86 }; |
|
87 |
|
88 if (tone >= CH_MAITAIKHU && tone <= CH_NIKHAHIT) { |
|
89 return lowerLeftTones[glyphSet][tone - CH_MAITAIKHU]; |
|
90 } |
|
91 |
|
92 return tone; |
|
93 } |
|
94 |
|
95 LEUnicode ThaiShaping::upperLeftTone(LEUnicode tone, le_uint8 glyphSet) |
|
96 { |
|
97 static const LEUnicode upperLeftTones[][7] = { |
|
98 {0x0E6F, 0x0E70, 0x0E71, 0x0E72, 0x0E73, 0x0E74, 0x0E75}, |
|
99 {0xF712, 0xF713, 0xF714, 0xF715, 0xF716, 0xF717, 0xF711}, |
|
100 {0xF889, 0xF88A, 0xF88D, 0xF890, 0xF893, 0xF896, 0xF899}, |
|
101 {0x0E47, 0x0E48, 0x0E49, 0x0E4A, 0x0E4B, 0x0E4C, 0x0E4D} |
|
102 }; |
|
103 |
|
104 if (tone >= CH_MAITAIKHU && tone <= CH_NIKHAHIT) { |
|
105 return upperLeftTones[glyphSet][tone - CH_MAITAIKHU]; |
|
106 } |
|
107 |
|
108 return tone; |
|
109 } |
|
110 |
|
111 LEUnicode ThaiShaping::lowerBelowVowel(LEUnicode vowel, le_uint8 glyphSet) |
|
112 { |
|
113 static const LEUnicode lowerBelowVowels[][3] = { |
|
114 {0x0E3C, 0x0E3D, 0x0E3E}, |
|
115 {0xF718, 0xF719, 0xF71A}, |
|
116 {0x0E38, 0x0E39, 0x0E3A}, |
|
117 {0x0E38, 0x0E39, 0x0E3A} |
|
118 |
|
119 }; |
|
120 |
|
121 if (vowel >= CH_SARA_U && vowel <= CH_PHINTHU) { |
|
122 return lowerBelowVowels[glyphSet][vowel - CH_SARA_U]; |
|
123 } |
|
124 |
|
125 return vowel; |
|
126 } |
|
127 |
|
128 LEUnicode ThaiShaping::noDescenderCOD(LEUnicode cod, le_uint8 glyphSet) |
|
129 { |
|
130 static const LEUnicode noDescenderCODs[][4] = { |
|
131 {0x0E60, 0x0E0E, 0x0E0F, 0x0E63}, |
|
132 {0xF70F, 0x0E0E, 0x0E0F, 0xF700}, |
|
133 {0x0E0D, 0x0E0E, 0x0E0F, 0x0E10}, |
|
134 {0x0E0D, 0x0E0E, 0x0E0F, 0x0E10} |
|
135 |
|
136 }; |
|
137 |
|
138 if (cod >= CH_YO_YING && cod <= CH_THO_THAN) { |
|
139 return noDescenderCODs[glyphSet][cod - CH_YO_YING]; |
|
140 } |
|
141 |
|
142 return cod; |
|
143 } |
|
144 |
|
145 le_uint8 ThaiShaping::doTransition (StateTransition transition, LEUnicode currChar, le_int32 inputIndex, le_uint8 glyphSet, |
|
146 LEUnicode errorChar, LEUnicode *outputBuffer, LEGlyphStorage &glyphStorage, le_int32 &outputIndex) |
|
147 { |
|
148 LEErrorCode success = LE_NO_ERROR; |
|
149 |
|
150 switch (transition.action) { |
|
151 case tA: |
|
152 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
153 outputBuffer[outputIndex++] = currChar; |
|
154 break; |
|
155 |
|
156 case tC: |
|
157 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
158 outputBuffer[outputIndex++] = currChar; |
|
159 break; |
|
160 |
|
161 case tD: |
|
162 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
163 outputBuffer[outputIndex++] = leftAboveVowel(currChar, glyphSet); |
|
164 break; |
|
165 |
|
166 case tE: |
|
167 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
168 outputBuffer[outputIndex++] = lowerRightTone(currChar, glyphSet); |
|
169 break; |
|
170 |
|
171 case tF: |
|
172 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
173 outputBuffer[outputIndex++] = lowerLeftTone(currChar, glyphSet); |
|
174 break; |
|
175 |
|
176 case tG: |
|
177 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
178 outputBuffer[outputIndex++] = upperLeftTone(currChar, glyphSet); |
|
179 break; |
|
180 |
|
181 case tH: |
|
182 { |
|
183 LEUnicode cod = outputBuffer[outputIndex - 1]; |
|
184 LEUnicode coa = noDescenderCOD(cod, glyphSet); |
|
185 |
|
186 if (cod != coa) { |
|
187 outputBuffer[outputIndex - 1] = coa; |
|
188 |
|
189 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
190 outputBuffer[outputIndex++] = currChar; |
|
191 break; |
|
192 } |
|
193 |
|
194 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
195 outputBuffer[outputIndex++] = lowerBelowVowel(currChar, glyphSet); |
|
196 break; |
|
197 } |
|
198 |
|
199 case tR: |
|
200 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
201 outputBuffer[outputIndex++] = errorChar; |
|
202 |
|
203 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
204 outputBuffer[outputIndex++] = currChar; |
|
205 break; |
|
206 |
|
207 case tS: |
|
208 if (currChar == CH_SARA_AM) { |
|
209 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
210 outputBuffer[outputIndex++] = errorChar; |
|
211 } |
|
212 |
|
213 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
214 outputBuffer[outputIndex++] = currChar; |
|
215 break; |
|
216 |
|
217 default: |
|
218 // FIXME: if we get here, there's an error |
|
219 // in the state table! |
|
220 glyphStorage.setCharIndex(outputIndex, inputIndex, success); |
|
221 outputBuffer[outputIndex++] = currChar; |
|
222 break; |
|
223 } |
|
224 |
|
225 return transition.nextState; |
|
226 } |
|
227 |
|
228 le_uint8 ThaiShaping::getNextState(LEUnicode ch, le_uint8 prevState, le_int32 inputIndex, le_uint8 glyphSet, LEUnicode errorChar, |
|
229 le_uint8 &charClass, LEUnicode *output, LEGlyphStorage &glyphStorage, le_int32 &outputIndex) |
|
230 { |
|
231 StateTransition transition; |
|
232 |
|
233 charClass = getCharClass(ch); |
|
234 transition = getTransition(prevState, charClass); |
|
235 |
|
236 return doTransition(transition, ch, inputIndex, glyphSet, errorChar, output, glyphStorage, outputIndex); |
|
237 } |
|
238 |
|
239 le_bool ThaiShaping::isLegalHere(LEUnicode ch, le_uint8 prevState) |
|
240 { |
|
241 le_uint8 charClass = getCharClass(ch); |
|
242 StateTransition transition = getTransition(prevState, charClass); |
|
243 |
|
244 switch (transition.action) { |
|
245 case tA: |
|
246 case tC: |
|
247 case tD: |
|
248 case tE: |
|
249 case tF: |
|
250 case tG: |
|
251 case tH: |
|
252 return TRUE; |
|
253 |
|
254 case tR: |
|
255 case tS: |
|
256 return FALSE; |
|
257 |
|
258 default: |
|
259 // FIXME: if we get here, there's an error |
|
260 // in the state table! |
|
261 return FALSE; |
|
262 } |
|
263 } |
|
264 |
|
265 le_int32 ThaiShaping::compose(const LEUnicode *input, le_int32 offset, le_int32 charCount, le_uint8 glyphSet, |
|
266 LEUnicode errorChar, LEUnicode *output, LEGlyphStorage &glyphStorage) |
|
267 { |
|
268 le_uint8 state = 0; |
|
269 le_int32 inputIndex; |
|
270 le_int32 outputIndex = 0; |
|
271 le_uint8 conState = 0xFF; |
|
272 le_int32 conInput = -1; |
|
273 le_int32 conOutput = -1; |
|
274 |
|
275 for (inputIndex = 0; inputIndex < charCount; inputIndex += 1) { |
|
276 LEUnicode ch = input[inputIndex + offset]; |
|
277 le_uint8 charClass; |
|
278 |
|
279 // Decompose SARA AM into NIKHAHIT + SARA AA |
|
280 if (ch == CH_SARA_AM && isLegalHere(ch, state)) { |
|
281 outputIndex = conOutput; |
|
282 state = getNextState(CH_NIKHAHIT, conState, inputIndex, glyphSet, errorChar, charClass, |
|
283 output, glyphStorage, outputIndex); |
|
284 |
|
285 for (int j = conInput + 1; j < inputIndex; j += 1) { |
|
286 ch = input[j + offset]; |
|
287 state = getNextState(ch, state, j, glyphSet, errorChar, charClass, |
|
288 output, glyphStorage, outputIndex); |
|
289 } |
|
290 |
|
291 ch = CH_SARA_AA; |
|
292 } |
|
293 |
|
294 state = getNextState(ch, state, inputIndex, glyphSet, errorChar, charClass, |
|
295 output, glyphStorage, outputIndex); |
|
296 |
|
297 if (charClass >= CON && charClass <= COD) { |
|
298 conState = state; |
|
299 conInput = inputIndex; |
|
300 conOutput = outputIndex; |
|
301 } |
|
302 } |
|
303 |
|
304 return outputIndex; |
|
305 } |
|
306 |
|
307 U_NAMESPACE_END |