1 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> |
|
2 <html xmlns="http://www.w3.org/1999/xhtml"> |
|
3 <head> |
|
4 <meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/> <!-- media type must be a registered one; the charset parameter declares UTF-8 --> |
|
5 <title>TB9.2 Example Applications: examples/PIPS/antiword/src/chartrans.c Source File</title> |
|
6 <link href="tabs.css" rel="stylesheet" type="text/css"/> |
|
7 <link href="doxygen.css" rel="stylesheet" type="text/css"/> |
|
8 </head> |
|
9 <body> |
|
10 <!-- Generated by Doxygen 1.6.2 --> |
|
11 <h1>examples/PIPS/antiword/src/chartrans.c</h1><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/*</span> |
|
12 <a name="l00002"></a>00002 <span class="comment"> * chartrans.c</span> |
|
13 <a name="l00003"></a>00003 <span class="comment"> * Copyright (C) 1999-2004 A.J. van Os; Released under GNU GPL</span> |
|
14 <a name="l00004"></a>00004 <span class="comment"> *</span> |
|
15 <a name="l00005"></a>00005 <span class="comment"> * Description:</span> |
|
16 <a name="l00006"></a>00006 <span class="comment"> * Translate Word characters to local representation</span> |
|
17 <a name="l00007"></a>00007 <span class="comment"> */</span> |
|
18 <a name="l00008"></a>00008 |
|
19 <a name="l00009"></a>00009 <span class="preprocessor">#include &lt;stdlib.h&gt;</span> |
|
20 <a name="l00010"></a>00010 <span class="preprocessor">#include &lt;string.h&gt;</span> |
|
21 <a name="l00011"></a>00011 <span class="preprocessor">#include &lt;ctype.h&gt;</span> |
|
22 <a name="l00012"></a>00012 <span class="preprocessor">#if defined(__STDC_ISO_10646__)</span> |
|
23 <a name="l00013"></a>00013 <span class="preprocessor"></span><span class="preprocessor">#include &lt;wctype.h&gt;</span> |
|
24 <a name="l00014"></a>00014 <span class="preprocessor">#endif </span><span class="comment">/* __STDC_ISO_10646__ */</span> |
|
25 <a name="l00015"></a>00015 <span class="preprocessor">#include "antiword.h"</span> |
|
26 <a name="l00016"></a>00016 |
|
27 <a name="l00017"></a>00017 <span class="keyword">static</span> <span class="keyword">const</span> USHORT usCp850[] = { <span class="comment">/* DOS implementation of Latin1 */</span> |
|
28 <a name="l00018"></a>00018 0x00c7, 0x00fc, 0x00e9, 0x00e2, 0x00e4, 0x00e0, 0x00e5, 0x00e7, |
|
29 <a name="l00019"></a>00019 0x00ea, 0x00eb, 0x00e8, 0x00ef, 0x00ee, 0x00ec, 0x00c4, 0x00c5, |
|
30 <a name="l00020"></a>00020 0x00c9, 0x00e6, 0x00c6, 0x00f4, 0x00f6, 0x00f2, 0x00fb, 0x00f9, |
|
31 <a name="l00021"></a>00021 0x00ff, 0x00d6, 0x00dc, 0x00f8, 0x00a3, 0x00d8, 0x00d7, 0x0192, |
|
32 <a name="l00022"></a>00022 0x00e1, 0x00ed, 0x00f3, 0x00fa, 0x00f1, 0x00d1, 0x00aa, 0x00ba, |
|
33 <a name="l00023"></a>00023 0x00bf, 0x00ae, 0x00ac, 0x00bd, 0x00bc, 0x00a1, 0x00ab, 0x00bb, |
|
34 <a name="l00024"></a>00024 0x2591, 0x2592, 0x2593, 0x2502, 0x2524, 0x00c1, 0x00c2, 0x00c0, |
|
35 <a name="l00025"></a>00025 0x00a9, 0x2563, 0x2551, 0x2557, 0x255d, 0x00a2, 0x00a5, 0x2510, |
|
36 <a name="l00026"></a>00026 0x2514, 0x2534, 0x252c, 0x251c, 0x2500, 0x253c, 0x00e3, 0x00c3, |
|
37 <a name="l00027"></a>00027 0x255a, 0x2554, 0x2569, 0x2566, 0x2560, 0x2550, 0x256c, 0x00a4, |
|
38 <a name="l00028"></a>00028 0x00f0, 0x00d0, 0x00ca, 0x00cb, 0x00c8, 0x0131, 0x00cd, 0x00ce, |
|
39 <a name="l00029"></a>00029 0x00cf, 0x2518, 0x250c, 0x2588, 0x2584, 0x00a6, 0x00cc, 0x2580, |
|
40 <a name="l00030"></a>00030 0x00d3, 0x00df, 0x00d4, 0x00d2, 0x00f5, 0x00d5, 0x00b5, 0x00fe, |
|
41 <a name="l00031"></a>00031 0x00de, 0x00da, 0x00db, 0x00d9, 0x00fd, 0x00dd, 0x00af, 0x00b4, |
|
42 <a name="l00032"></a>00032 0x00ad, 0x00b1, 0x2017, 0x00be, 0x00b6, 0x00a7, 0x00f7, 0x00b8, |
|
43 <a name="l00033"></a>00033 0x00b0, 0x00a8, 0x00b7, 0x00b9, 0x00b3, 0x00b2, 0x25a0, 0x00a0, |
|
44 <a name="l00034"></a>00034 }; |
|
45 <a name="l00035"></a>00035 |
|
46 <a name="l00036"></a>00036 <span class="keyword">static</span> <span class="keyword">const</span> USHORT usCp1250[] = { <span class="comment">/* Windows implementation of Latin2 */</span> |
|
47 <a name="l00037"></a>00037 0x20ac, 0x003f, 0x201a, 0x003f, 0x201e, 0x2026, 0x2020, 0x2021, |
|
48 <a name="l00038"></a>00038 0x003f, 0x2030, 0x0160, 0x2039, 0x015a, 0x0164, 0x017d, 0x0179, |
|
49 <a name="l00039"></a>00039 0x003f, 0x2018, 0x2019, 0x201c, 0x201d, 0x2022, 0x2013, 0x2014, |
|
50 <a name="l00040"></a>00040 0x003f, 0x2122, 0x0161, 0x203a, 0x015b, 0x0165, 0x017e, 0x017a, |
|
51 <a name="l00041"></a>00041 0x00a0, 0x02c7, 0x02d8, 0x0141, 0x00a4, 0x0104, 0x00a6, 0x00a7, |
|
52 <a name="l00042"></a>00042 0x00a8, 0x00a9, 0x015e, 0x00ab, 0x00ac, 0x00ad, 0x00ae, 0x017b, |
|
53 <a name="l00043"></a>00043 0x00b0, 0x00b1, 0x02db, 0x0142, 0x00b4, 0x00b5, 0x00b6, 0x00b7, |
|
54 <a name="l00044"></a>00044 0x00b8, 0x0105, 0x015f, 0x00bb, 0x013d, 0x02dd, 0x013e, 0x017c, |
|
55 <a name="l00045"></a>00045 0x0154, 0x00c1, 0x00c2, 0x0102, 0x00c4, 0x0139, 0x0106, 0x00c7, |
|
56 <a name="l00046"></a>00046 0x010c, 0x00c9, 0x0118, 0x00cb, 0x011a, 0x00cd, 0x00ce, 0x010e, |
|
57 <a name="l00047"></a>00047 0x0110, 0x0143, 0x0147, 0x00d3, 0x00d4, 0x0150, 0x00d6, 0x00d7, |
|
58 <a name="l00048"></a>00048 0x0158, 0x016e, 0x00da, 0x0170, 0x00dc, 0x00dd, 0x0162, 0x00df, |
|
59 <a name="l00049"></a>00049 0x0155, 0x00e1, 0x00e2, 0x0103, 0x00e4, 0x013a, 0x0107, 0x00e7, |
|
60 <a name="l00050"></a>00050 0x010d, 0x00e9, 0x0119, 0x00eb, 0x011b, 0x00ed, 0x00ee, 0x010f, |
|
61 <a name="l00051"></a>00051 0x0111, 0x0144, 0x0148, 0x00f3, 0x00f4, 0x0151, 0x00f6, 0x00f7, |
|
62 <a name="l00052"></a>00052 0x0159, 0x016f, 0x00fa, 0x0171, 0x00fc, 0x00fd, 0x0163, 0x02d9, |
|
63 <a name="l00053"></a>00053 }; |
|
64 <a name="l00054"></a>00054 |
|
65 <a name="l00055"></a>00055 <span class="keyword">static</span> <span class="keyword">const</span> USHORT usCp1251[] = { <span class="comment">/* Windows implementation of Cyrillic */</span> |
|
66 <a name="l00056"></a>00056 0x0402, 0x0403, 0x201a, 0x0453, 0x201e, 0x2026, 0x2020, 0x2021, |
|
67 <a name="l00057"></a>00057 0x20ac, 0x2030, 0x0409, 0x2039, 0x040a, 0x040c, 0x040b, 0x040f, |
|
68 <a name="l00058"></a>00058 0x0452, 0x2018, 0x2019, 0x201c, 0x201d, 0x2022, 0x2013, 0x2014, |
|
69 <a name="l00059"></a>00059 0x00f3, 0x2122, 0x0459, 0x203a, 0x045a, 0x045c, 0x045b, 0x045f, |
|
70 <a name="l00060"></a>00060 0x00a0, 0x040e, 0x045e, 0x0408, 0x00a4, 0x0490, 0x00a6, 0x00a7, |
|
71 <a name="l00061"></a>00061 0x0401, 0x00a9, 0x0404, 0x00ab, 0x00ac, 0x00ad, 0x00ae, 0x0407, |
|
72 <a name="l00062"></a>00062 0x00b0, 0x00b1, 0x0406, 0x0456, 0x0491, 0x00b5, 0x00b6, 0x00b7, |
|
73 <a name="l00063"></a>00063 0x0451, 0x2116, 0x0454, 0x00bb, 0x0458, 0x0405, 0x0455, 0x0457, |
|
74 <a name="l00064"></a>00064 0x0410, 0x0411, 0x0412, 0x0413, 0x0414, 0x0415, 0x0416, 0x0417, |
|
75 <a name="l00065"></a>00065 0x0418, 0x0419, 0x041a, 0x041b, 0x041c, 0x041d, 0x041e, 0x041f, |
|
76 <a name="l00066"></a>00066 0x0420, 0x0421, 0x0422, 0x0423, 0x0424, 0x0425, 0x0426, 0x0427, |
|
77 <a name="l00067"></a>00067 0x0428, 0x0429, 0x042a, 0x042b, 0x042c, 0x042d, 0x042e, 0x042f, |
|
78 <a name="l00068"></a>00068 0x0430, 0x0431, 0x0432, 0x0433, 0x0434, 0x0435, 0x0436, 0x0437, |
|
79 <a name="l00069"></a>00069 0x0438, 0x0439, 0x043a, 0x043b, 0x043c, 0x043d, 0x043e, 0x043f, |
|
80 <a name="l00070"></a>00070 0x0440, 0x0441, 0x0442, 0x0443, 0x0444, 0x0445, 0x0446, 0x0447, |
|
81 <a name="l00071"></a>00071 0x0448, 0x0449, 0x044a, 0x044b, 0x044c, 0x044d, 0x044e, 0x044f, |
|
82 <a name="l00072"></a>00072 }; |
|
83 <a name="l00073"></a>00073 |
|
84 <a name="l00074"></a>00074 <span class="keyword">static</span> <span class="keyword">const</span> USHORT usCp1252[] = { <span class="comment">/* Windows implementation of Latin1 */</span> |
|
85 <a name="l00075"></a>00075 0x20ac, 0x003f, 0x201a, 0x0192, 0x201e, 0x2026, 0x2020, 0x2021, |
|
86 <a name="l00076"></a>00076 0x02c6, 0x2030, 0x0160, 0x2039, 0x0152, 0x003f, 0x017d, 0x003f, |
|
87 <a name="l00077"></a>00077 0x003f, 0x2018, 0x2019, 0x201c, 0x201d, 0x2022, 0x2013, 0x2014, |
|
88 <a name="l00078"></a>00078 0x02dc, 0x2122, 0x0161, 0x203a, 0x0153, 0x003f, 0x017e, 0x0178, |
|
89 <a name="l00079"></a>00079 0x00a0, 0x00a1, 0x00a2, 0x00a3, 0x00a4, 0x00a5, 0x00a6, 0x00a7, |
|
90 <a name="l00080"></a>00080 0x00a8, 0x00a9, 0x00aa, 0x00ab, 0x00ac, 0x00ad, 0x00ae, 0x00af, |
|
91 <a name="l00081"></a>00081 0x00b0, 0x00b1, 0x00b2, 0x00b3, 0x00b4, 0x00b5, 0x00b6, 0x00b7, |
|
92 <a name="l00082"></a>00082 0x00b8, 0x00b9, 0x00ba, 0x00bb, 0x00bc, 0x00bd, 0x00be, 0x00bf, |
|
93 <a name="l00083"></a>00083 0x00c0, 0x00c1, 0x00c2, 0x00c3, 0x00c4, 0x00c5, 0x00c6, 0x00c7, |
|
94 <a name="l00084"></a>00084 0x00c8, 0x00c9, 0x00ca, 0x00cb, 0x00cc, 0x00cd, 0x00ce, 0x00cf, |
|
95 <a name="l00085"></a>00085 0x00d0, 0x00d1, 0x00d2, 0x00d3, 0x00d4, 0x00d5, 0x00d6, 0x00d7, |
|
96 <a name="l00086"></a>00086 0x00d8, 0x00d9, 0x00da, 0x00db, 0x00dc, 0x00dd, 0x00de, 0x00df, |
|
97 <a name="l00087"></a>00087 0x00e0, 0x00e1, 0x00e2, 0x00e3, 0x00e4, 0x00e5, 0x00e6, 0x00e7, |
|
98 <a name="l00088"></a>00088 0x00e8, 0x00e9, 0x00ea, 0x00eb, 0x00ec, 0x00ed, 0x00ee, 0x00ef, |
|
99 <a name="l00089"></a>00089 0x00f0, 0x00f1, 0x00f2, 0x00f3, 0x00f4, 0x00f5, 0x00f6, 0x00f7, |
|
100 <a name="l00090"></a>00090 0x00f8, 0x00f9, 0x00fa, 0x00fb, 0x00fc, 0x00fd, 0x00fe, 0x00ff, |
|
101 <a name="l00091"></a>00091 }; |
|
102 <a name="l00092"></a>00092 |
|
103 <a name="l00093"></a>00093 <span class="keyword">static</span> <span class="keyword">const</span> USHORT usMacRoman[] = { <span class="comment">/* Apple implementation of Latin1 */</span> |
|
104 <a name="l00094"></a>00094 0x00c4, 0x00c5, 0x00c7, 0x00c9, 0x00d1, 0x00d6, 0x00dc, 0x00e1, |
|
105 <a name="l00095"></a>00095 0x00e0, 0x00e2, 0x00e4, 0x00e3, 0x00e5, 0x00e7, 0x00e9, 0x00e8, |
|
106 <a name="l00096"></a>00096 0x00ea, 0x00eb, 0x00ed, 0x00ec, 0x00ee, 0x00ef, 0x00f1, 0x00f3, |
|
107 <a name="l00097"></a>00097 0x00f2, 0x00f4, 0x00f6, 0x00f5, 0x00fa, 0x00f9, 0x00fb, 0x00fc, |
|
108 <a name="l00098"></a>00098 0x2020, 0x00b0, 0x00a2, 0x00a3, 0x00a7, 0x2022, 0x00b6, 0x00df, |
|
109 <a name="l00099"></a>00099 0x00ae, 0x00a9, 0x2122, 0x00b4, 0x00a8, 0x2260, 0x00c6, 0x00d8, |
|
110 <a name="l00100"></a>00100 0x221e, 0x00b1, 0x2264, 0x2265, 0x00a5, 0x00b5, 0x2202, 0x2211, |
|
111 <a name="l00101"></a>00101 0x220f, 0x03c0, 0x222b, 0x00aa, 0x00ba, 0x2126, 0x00e6, 0x00f8, |
|
112 <a name="l00102"></a>00102 0x00bf, 0x00a1, 0x00ac, 0x221a, 0x0192, 0x2248, 0x2206, 0x00ab, |
|
113 <a name="l00103"></a>00103 0x00bb, 0x2026, 0x00a0, 0x00c0, 0x00c3, 0x00d5, 0x0152, 0x0153, |
|
114 <a name="l00104"></a>00104 0x2013, 0x2014, 0x201c, 0x201d, 0x2018, 0x2019, 0x00f7, 0x25ca, |
|
115 <a name="l00105"></a>00105 0x00ff, 0x0178, 0x2044, 0x00a4, 0x2039, 0x203a, 0xfb01, 0xfb02, |
|
116 <a name="l00106"></a>00106 0x2021, 0x00b7, 0x201a, 0x201e, 0x2030, 0x00c2, 0x00ca, 0x00c1, |
|
117 <a name="l00107"></a>00107 0x00cb, 0x00c8, 0x00cd, 0x00ce, 0x00cf, 0x00cc, 0x00d3, 0x00d4, |
|
118 <a name="l00108"></a>00108 0x003f, 0x00d2, 0x00da, 0x00db, 0x00d9, 0x0131, 0x02c6, 0x02dc, |
|
119 <a name="l00109"></a>00109 0x00af, 0x02d8, 0x02d9, 0x02da, 0x00b8, 0x02dd, 0x02db, 0x02c7, |
|
120 <a name="l00110"></a>00110 }; |
|
121 <a name="l00111"></a>00111 |
|
122 <a name="l00112"></a>00112 <span class="keyword">static</span> <span class="keyword">const</span> USHORT usPrivateArea[] = { |
|
123 <a name="l00113"></a>00113 0x0020, 0x0021, 0x2200, 0x0023, 0x2203, 0x0025, 0x0026, 0x220d, |
|
124 <a name="l00114"></a>00114 0x0028, 0x0029, 0x2217, 0x002b, 0x002c, 0x2212, 0x002e, 0x002f, |
|
125 <a name="l00115"></a>00115 0x0030, 0x0031, 0x0032, 0x0033, 0x0034, 0x0035, 0x0036, 0x0037, |
|
126 <a name="l00116"></a>00116 0x0038, 0x0039, 0x003a, 0x003b, 0x003c, 0x2019, 0x003e, 0x003f, |
|
127 <a name="l00117"></a>00117 0x201d, 0x201c, 0x0392, 0x03a7, 0x0394, 0x0395, 0x03a6, 0x0393, |
|
128 <a name="l00118"></a>00118 0x0397, 0x0399, 0x03d1, 0x039a, 0x039b, 0x039c, 0x039d, 0x039f, |
|
129 <a name="l00119"></a>00119 0x03a0, 0x0398, 0x03a1, 0x03a3, 0x03a4, 0x03a5, 0x03c2, 0x03a9, |
|
130 <a name="l00120"></a>00120 0x039e, 0x03a8, 0x0396, 0x005b, 0x2234, 0x005d, 0x22a5, 0x005f, |
|
131 <a name="l00121"></a>00121 0x003f, 0x03b1, 0x03b2, 0x03c7, 0x03b4, 0x03b5, 0x03c6, 0x03b3, |
|
132 <a name="l00122"></a>00122 0x03b7, 0x03b9, 0x03d5, 0x03ba, 0x03bb, 0x03bc, 0x03bd, 0x03bf, |
|
133 <a name="l00123"></a>00123 0x03c0, 0x03b8, 0x03c1, 0x03c3, 0x03c4, 0x03c5, 0x03d6, 0x03c9, |
|
134 <a name="l00124"></a>00124 0x03be, 0x03c8, 0x03b6, 0x007b, 0x007c, 0x007d, 0x223c, 0x003f, |
|
135 <a name="l00125"></a>00125 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, |
|
136 <a name="l00126"></a>00126 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, |
|
137 <a name="l00127"></a>00127 0x003f, 0x003f, 0x003f, 0x2022, 0x003f, 0x003f, 0x003f, 0x003f, |
|
138 <a name="l00128"></a>00128 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, 0x003f, |
|
139 <a name="l00129"></a>00129 0x20ac, 0x03d2, 0x2032, 0x2264, 0x2044, 0x221e, 0x0192, 0x2663, |
|
140 <a name="l00130"></a>00130 0x2666, 0x2665, 0x2660, 0x2194, 0x2190, 0x2191, 0x2192, 0x2193, |
|
141 <a name="l00131"></a>00131 0x00b0, 0x00b1, 0x2033, 0x2265, 0x00d7, 0x221d, 0x2202, 0x2022, |
|
142 <a name="l00132"></a>00132 0x00f7, 0x2260, 0x2261, 0x2248, 0x2026, 0x007c, 0x23af, 0x21b5, |
|
143 <a name="l00133"></a>00133 0x2135, 0x2111, 0x211c, 0x2118, 0x2297, 0x2295, 0x2205, 0x2229, |
|
144 <a name="l00134"></a>00134 0x222a, 0x2283, 0x2287, 0x2284, 0x2282, 0x2286, 0x2208, 0x2209, |
|
145 <a name="l00135"></a>00135 0x2220, 0x2207, 0x00ae, 0x00a9, 0x2122, 0x220f, 0x221a, 0x22c5, |
|
146 <a name="l00136"></a>00136 0x00ac, 0x2227, 0x2228, 0x21d4, 0x21d0, 0x21d1, 0x21d2, 0x21d3, |
|
147 <a name="l00137"></a>00137 0x22c4, 0x3008, 0x00ae, 0x00a9, 0x2122, 0x2211, 0x239b, 0x239c, |
|
148 <a name="l00138"></a>00138 0x239d, 0x23a1, 0x23a2, 0x23a3, 0x23a7, 0x23a8, 0x23a9, 0x23aa, |
|
149 <a name="l00139"></a>00139 0x003f, 0x3009, 0x222b, 0x2320, 0x23ae, 0x2321, 0x239e, 0x239f, |
|
150 <a name="l00140"></a>00140 0x23a0, 0x23a4, 0x23a5, 0x23a6, 0x23ab, 0x23ac, 0x23ad, 0x003f, |
|
151 <a name="l00141"></a>00141 }; |
|
152 <a name="l00142"></a>00142 |
|
153 <a name="l00143"></a>00143 <span class="keyword">typedef</span> <span class="keyword">struct </span>char_table_tag { |
|
154 <a name="l00144"></a>00144 UCHAR ucLocal; |
|
155 <a name="l00145"></a>00145 USHORT usUnicode; |
|
156 <a name="l00146"></a>00146 } char_table_type; |
|
157 <a name="l00147"></a>00147 |
|
158 <a name="l00148"></a>00148 <span class="keyword">static</span> char_table_type atCharTable[256]; |
|
159 <a name="l00149"></a>00149 <span class="keyword">static</span> <span class="keywordtype">size_t</span> tNextPosFree = 0; |
|
160 <a name="l00150"></a>00150 |
|
161 <a name="l00151"></a>00151 |
|
162 <a name="l00152"></a>00152 <span class="comment">/*</span> |
|
163 <a name="l00153"></a>00153 <span class="comment"> * iCompare - compare two records</span> |
|
164 <a name="l00154"></a>00154 <span class="comment"> *</span> |
|
165 <a name="l00155"></a>00155 <span class="comment"> * Compares two records. For use by qsort(3C) and bsearch(3C).</span> |
|
166 <a name="l00156"></a>00156 <span class="comment"> *</span> |
|
167 <a name="l00157"></a>00157 <span class="comment"> * returns -1 if rec1 &lt; rec2, 0 if rec1 == rec2, 1 if rec1 &gt; rec2</span> |
|
168 <a name="l00158"></a>00158 <span class="comment"> */</span> |
|
169 <a name="l00159"></a>00159 <span class="keyword">static</span> <span class="keywordtype">int</span> |
|
170 <a name="l00160"></a>00160 iCompare(<span class="keyword">const</span> <span class="keywordtype">void</span> *pvRecord1, <span class="keyword">const</span> <span class="keywordtype">void</span> *pvRecord2) |
|
171 <a name="l00161"></a>00161 { |
|
172 <a name="l00162"></a>00162 USHORT usUnicode1, usUnicode2; |
|
173 <a name="l00163"></a>00163 |
|
174 <a name="l00164"></a>00164 usUnicode1 = ((char_table_type *)pvRecord1)->usUnicode; |
|
175 <a name="l00165"></a>00165 usUnicode2 = ((char_table_type *)pvRecord2)->usUnicode; |
|
176 <a name="l00166"></a>00166 |
|
177 <a name="l00167"></a>00167 <span class="keywordflow">if</span> (usUnicode1 &lt; usUnicode2) { |
|
178 <a name="l00168"></a>00168 <span class="keywordflow">return</span> -1; |
|
179 <a name="l00169"></a>00169 } |
|
180 <a name="l00170"></a>00170 <span class="keywordflow">if</span> (usUnicode1 > usUnicode2) { |
|
181 <a name="l00171"></a>00171 <span class="keywordflow">return</span> 1; |
|
182 <a name="l00172"></a>00172 } |
|
183 <a name="l00173"></a>00173 <span class="keywordflow">return</span> 0; |
|
184 <a name="l00174"></a>00174 } <span class="comment">/* end of iCompare */</span> |
|
185 <a name="l00175"></a>00175 |
|
186 <a name="l00176"></a>00176 <span class="comment">/*</span> |
|
187 <a name="l00177"></a>00177 <span class="comment"> * pGetCharTableRecord - get the character table record</span> |
|
188 <a name="l00178"></a>00178 <span class="comment"> *</span> |
|
189 <a name="l00179"></a>00179 <span class="comment"> * returns a pointer to the record when found, otherwise NULL</span> |
|
190 <a name="l00180"></a>00180 <span class="comment"> */</span> |
|
191 <a name="l00181"></a>00181 <span class="keyword">static</span> <span class="keyword">const</span> char_table_type * |
|
192 <a name="l00182"></a>00182 pGetCharTableRecord(USHORT usUnicode) |
|
193 <a name="l00183"></a>00183 { |
|
194 <a name="l00184"></a>00184 char_table_type tKey; |
|
195 <a name="l00185"></a>00185 |
|
196 <a name="l00186"></a>00186 <span class="keywordflow">if</span> (tNextPosFree == 0) { |
|
197 <a name="l00187"></a>00187 <span class="keywordflow">return</span> NULL; |
|
198 <a name="l00188"></a>00188 } |
|
199 <a name="l00189"></a>00189 tKey.usUnicode = usUnicode; |
|
200 <a name="l00190"></a>00190 tKey.ucLocal = 0; |
|
201 <a name="l00191"></a>00191 <span class="keywordflow">return</span> (char_table_type *)bsearch(&amp;tKey, |
|
202 <a name="l00192"></a>00192 atCharTable, |
|
203 <a name="l00193"></a>00193 tNextPosFree, <span class="keyword">sizeof</span>(atCharTable[0]), |
|
204 <a name="l00194"></a>00194 iCompare); |
|
205 <a name="l00195"></a>00195 } <span class="comment">/* end of pGetCharTableRecord */</span> |
|
206 <a name="l00196"></a>00196 |
|
207 <a name="l00197"></a>00197 <span class="comment">/*</span> |
|
208 <a name="l00198"></a>00198 <span class="comment"> * ucGetBulletCharacter - get the local representation of the bullet</span> |
|
209 <a name="l00199"></a>00199 <span class="comment"> */</span> |
|
210 <a name="l00200"></a>00200 UCHAR |
|
211 <a name="l00201"></a>00201 ucGetBulletCharacter(conversion_type eConversionType, encoding_type eEncoding) |
|
212 <a name="l00202"></a>00202 { |
|
213 <a name="l00203"></a>00203 <span class="preprocessor">#if defined(__riscos)</span> |
|
214 <a name="l00204"></a>00204 <span class="preprocessor"></span> <span class="keywordflow">return</span> 0x8f; |
|
215 <a name="l00205"></a>00205 <span class="preprocessor">#else</span> |
|
216 <a name="l00206"></a>00206 <span class="preprocessor"></span> <span class="keyword">const</span> char_table_type *pRec; |
|
217 <a name="l00207"></a>00207 |
|
218 <a name="l00208"></a>00208 fail(eEncoding == encoding_utf_8); |
|
219 <a name="l00209"></a>00209 |
|
220 <a name="l00210"></a>00210 <span class="keywordflow">if</span> (eEncoding == encoding_latin_1 &amp;&amp; |
|
221 <a name="l00211"></a>00211 (eConversionType == conversion_ps || |
|
222 <a name="l00212"></a>00212 eConversionType == conversion_pdf)) { |
|
223 <a name="l00213"></a>00213 <span class="comment">/* Ugly, but it makes the PostScript and PDF look better */</span> |
|
224 <a name="l00214"></a>00214 <span class="keywordflow">return</span> (UCHAR)143; |
|
225 <a name="l00215"></a>00215 } |
|
226 <a name="l00216"></a>00216 <span class="keywordflow">if</span> (eConversionType != conversion_text &amp;&amp; |
|
227 <a name="l00217"></a>00217 eConversionType != conversion_fmt_text) { |
|
228 <a name="l00218"></a>00218 pRec = pGetCharTableRecord(UNICODE_BULLET); |
|
229 <a name="l00219"></a>00219 <span class="keywordflow">if</span> (pRec != NULL) { |
|
230 <a name="l00220"></a>00220 <span class="keywordflow">return</span> pRec->ucLocal; |
|
231 <a name="l00221"></a>00221 } |
|
232 <a name="l00222"></a>00222 pRec = pGetCharTableRecord(UNICODE_BULLET_OPERATOR); |
|
233 <a name="l00223"></a>00223 <span class="keywordflow">if</span> (pRec != NULL) { |
|
234 <a name="l00224"></a>00224 <span class="keywordflow">return</span> pRec->ucLocal; |
|
235 <a name="l00225"></a>00225 } |
|
236 <a name="l00226"></a>00226 pRec = pGetCharTableRecord(UNICODE_MIDDLE_DOT); |
|
237 <a name="l00227"></a>00227 <span class="keywordflow">if</span> (pRec != NULL) { |
|
238 <a name="l00228"></a>00228 <span class="keywordflow">return</span> pRec->ucLocal; |
|
239 <a name="l00229"></a>00229 } |
|
240 <a name="l00230"></a>00230 } |
|
241 <a name="l00231"></a>00231 <span class="keywordflow">return</span> (UCHAR)<span class="charliteral">'.'</span>; |
|
242 <a name="l00232"></a>00232 <span class="preprocessor">#endif </span><span class="comment">/* __riscos */</span> |
|
243 <a name="l00233"></a>00233 } <span class="comment">/* end of ucGetBulletCharacter */</span> |
|
244 <a name="l00234"></a>00234 |
|
245 <a name="l00235"></a>00235 <span class="comment">/*</span> |
|
246 <a name="l00236"></a>00236 <span class="comment"> * ucGetNbspCharacter - get the local representation of the non-breaking space</span> |
|
247 <a name="l00237"></a>00237 <span class="comment"> */</span> |
|
248 <a name="l00238"></a>00238 UCHAR |
|
249 <a name="l00239"></a>00239 ucGetNbspCharacter(<span class="keywordtype">void</span>) |
|
250 <a name="l00240"></a>00240 { |
|
251 <a name="l00241"></a>00241 <span class="keyword">const</span> char_table_type *pRec; |
|
252 <a name="l00242"></a>00242 |
|
253 <a name="l00243"></a>00243 pRec = pGetCharTableRecord(0x00a0); <span class="comment">/* Unicode non-breaking space */</span> |
|
254 <a name="l00244"></a>00244 <span class="keywordflow">if</span> (pRec == NULL) { |
|
255 <a name="l00245"></a>00245 DBG_MSG(<span class="stringliteral">"Non-breaking space record not found"</span>); |
|
256 <a name="l00246"></a>00246 <span class="comment">/* No value found, use the best guess */</span> |
|
257 <a name="l00247"></a>00247 <span class="keywordflow">return</span> (UCHAR)0xa0; |
|
258 <a name="l00248"></a>00248 } |
|
259 <a name="l00249"></a>00249 <span class="keywordflow">return</span> pRec->ucLocal; |
|
260 <a name="l00250"></a>00250 } <span class="comment">/* end of ucGetNbspCharacter */</span> |
|
261 <a name="l00251"></a>00251 |
|
262 <a name="l00252"></a>00252 <span class="comment">/*</span> |
|
263 <a name="l00253"></a>00253 <span class="comment"> * bReadCharacterMappingTable - read the mapping table</span> |
|
264 <a name="l00254"></a>00254 <span class="comment"> *</span> |
|
265 <a name="l00255"></a>00255 <span class="comment"> * Read the character mapping table from file and have the contents sorted</span> |
|
266 <a name="l00256"></a>00256 <span class="comment"> *</span> |
|
267 <a name="l00257"></a>00257 <span class="comment"> * returns TRUE if successful, otherwise FALSE</span> |
|
268 <a name="l00258"></a>00258 <span class="comment"> */</span> |
|
269 <a name="l00259"></a>00259 BOOL |
|
270 <a name="l00260"></a>00260 bReadCharacterMappingTable(FILE *pFile) |
|
271 <a name="l00261"></a>00261 { |
|
272 <a name="l00262"></a>00262 <span class="keywordtype">char</span> *pcTmp; |
|
273 <a name="l00263"></a>00263 ULONG ulUnicode; |
|
274 <a name="l00264"></a>00264 UINT uiLocal; |
|
275 <a name="l00265"></a>00265 <span class="keywordtype">int</span> iFields; |
|
276 <a name="l00266"></a>00266 <span class="keywordtype">char</span> szLine[81]; |
|
277 <a name="l00267"></a>00267 |
|
278 <a name="l00268"></a>00268 <span class="keywordflow">if</span> (pFile == NULL) { |
|
279 <a name="l00269"></a>00269 <span class="keywordflow">return</span> FALSE; |
|
280 <a name="l00270"></a>00270 } |
|
281 <a name="l00271"></a>00271 |
|
282 <a name="l00272"></a>00272 <span class="comment">/* Clean the table first */</span> |
|
283 <a name="l00273"></a>00273 (void)memset(atCharTable, 0, <span class="keyword">sizeof</span>(atCharTable)); |
|
284 <a name="l00274"></a>00274 |
|
285 <a name="l00275"></a>00275 <span class="comment">/* Fill the table */</span> |
|
286 <a name="l00276"></a>00276 <span class="keywordflow">while</span> (fgets(szLine, (<span class="keywordtype">int</span>)<span class="keyword">sizeof</span>(szLine), pFile)) { |
|
287 <a name="l00277"></a>00277 <span class="keywordflow">if</span> (szLine[0] == <span class="charliteral">'#'</span> || |
|
288 <a name="l00278"></a>00278 szLine[0] == <span class="charliteral">'\r'</span> || |
|
289 <a name="l00279"></a>00279 szLine[0] == <span class="charliteral">'\n'</span>) { |
|
290 <a name="l00280"></a>00280 <span class="comment">/* Comment or empty line */</span> |
|
291 <a name="l00281"></a>00281 <span class="keywordflow">continue</span>; |
|
292 <a name="l00282"></a>00282 } |
|
293 <a name="l00283"></a>00283 iFields = sscanf(szLine, <span class="stringliteral">"%x %lx %*s"</span>, &amp;uiLocal, &amp;ulUnicode); |
|
294 <a name="l00284"></a>00284 <span class="keywordflow">if</span> (iFields != 2) { |
|
295 <a name="l00285"></a>00285 pcTmp = strchr(szLine, <span class="charliteral">'\r'</span>); |
|
296 <a name="l00286"></a>00286 <span class="keywordflow">if</span> (pcTmp != NULL) { |
|
297 <a name="l00287"></a>00287 *pcTmp = <span class="charliteral">'\0'</span>; |
|
298 <a name="l00288"></a>00288 } |
|
299 <a name="l00289"></a>00289 pcTmp = strchr(szLine, <span class="charliteral">'\n'</span>); |
|
300 <a name="l00290"></a>00290 <span class="keywordflow">if</span> (pcTmp != NULL) { |
|
301 <a name="l00291"></a>00291 *pcTmp = <span class="charliteral">'\0'</span>; |
|
302 <a name="l00292"></a>00292 } |
|
303 <a name="l00293"></a>00293 werr(0, <span class="stringliteral">"Syntax error in: '%s'"</span>, szLine); |
|
304 <a name="l00294"></a>00294 <span class="keywordflow">continue</span>; |
|
305 <a name="l00295"></a>00295 } |
|
306 <a name="l00296"></a>00296 <span class="keywordflow">if</span> (uiLocal > 0xff || ulUnicode > 0xffff) { |
|
307 <a name="l00297"></a>00297 werr(0, <span class="stringliteral">"Syntax error in: '%02x %04lx'"</span>, |
|
308 <a name="l00298"></a>00298 uiLocal, ulUnicode); |
|
309 <a name="l00299"></a>00299 <span class="keywordflow">continue</span>; |
|
310 <a name="l00300"></a>00300 } |
|
311 <a name="l00301"></a>00301 <span class="comment">/* Store only the relevant entries */</span> |
|
312 <a name="l00302"></a>00302 <span class="keywordflow">if</span> (uiLocal != ulUnicode || uiLocal >= 0x80) { |
|
313 <a name="l00303"></a>00303 atCharTable[tNextPosFree].ucLocal = (UCHAR)uiLocal; |
|
314 <a name="l00304"></a>00304 atCharTable[tNextPosFree].usUnicode = (USHORT)ulUnicode; |
|
315 <a name="l00305"></a>00305 tNextPosFree++; |
|
316 <a name="l00306"></a>00306 } |
|
317 <a name="l00307"></a>00307 <span class="keywordflow">if</span> (tNextPosFree >= elementsof(atCharTable)) { |
|
318 <a name="l00308"></a>00308 werr(0, <span class="stringliteral">"Too many entries in the character mapping "</span> |
|
319 <a name="l00309"></a>00309 <span class="stringliteral">"file. Ignoring the rest."</span>); |
|
320 <a name="l00310"></a>00310 <span class="keywordflow">break</span>; |
|
321 <a name="l00311"></a>00311 } |
|
322 <a name="l00312"></a>00312 } |
|
323 <a name="l00313"></a>00313 |
|
324 <a name="l00314"></a>00314 <span class="keywordflow">if</span> (tNextPosFree != 0) { |
|
325 <a name="l00315"></a>00315 DBG_HEX(atCharTable[0].usUnicode); |
|
326 <a name="l00316"></a>00316 DBG_HEX(atCharTable[tNextPosFree - 1].usUnicode); |
|
327 <a name="l00317"></a>00317 |
|
328 <a name="l00318"></a>00318 qsort(atCharTable, |
|
329 <a name="l00319"></a>00319 tNextPosFree, <span class="keyword">sizeof</span>(atCharTable[0]), |
|
330 <a name="l00320"></a>00320 iCompare); |
|
331 <a name="l00321"></a>00321 |
|
332 <a name="l00322"></a>00322 DBG_HEX(atCharTable[0].usUnicode); |
|
333 <a name="l00323"></a>00323 DBG_HEX(atCharTable[tNextPosFree - 1].usUnicode); |
|
334 <a name="l00324"></a>00324 } |
|
335 <a name="l00325"></a>00325 |
|
336 <a name="l00326"></a>00326 <span class="keywordflow">return</span> TRUE; |
|
337 <a name="l00327"></a>00327 } <span class="comment">/* end of bReadCharacterMappingTable */</span> |
|
338 <a name="l00328"></a>00328 |
|
339 <a name="l00329"></a>00329 <span class="comment">/*</span> |
|
340 <a name="l00330"></a>00330 <span class="comment"> * ulTranslateCharacters - Translate characters to local representation</span> |
|
341 <a name="l00331"></a>00331 <span class="comment"> *</span> |
|
342 <a name="l00332"></a>00332 <span class="comment"> * Translate all characters to local representation</span> |
|
343 <a name="l00333"></a>00333 <span class="comment"> *</span> |
|
344 <a name="l00334"></a>00334 <span class="comment"> * returns the translated character</span> |
|
345 <a name="l00335"></a>00335 <span class="comment"> */</span> |
|
346 <a name="l00336"></a>00336 ULONG |
|
347 <a name="l00337"></a>00337 ulTranslateCharacters(USHORT usChar, ULONG ulFileOffset, <span class="keywordtype">int</span> iWordVersion, |
|
348 <a name="l00338"></a>00338 conversion_type eConversionType, encoding_type eEncoding, |
|
349 <a name="l00339"></a>00339 BOOL bUseMacCharSet) |
|
350 <a name="l00340"></a>00340 { |
|
351 <a name="l00341"></a>00341 <span class="keyword">const</span> char_table_type *pTmp; |
|
352 <a name="l00342"></a>00342 <span class="keyword">const</span> USHORT *usCharSet; |
|
353 <a name="l00343"></a>00343 |
|
354 <a name="l00344"></a>00344 usCharSet = NULL; |
|
355 <a name="l00345"></a>00345 <span class="keywordflow">if</span> (bUseMacCharSet) { |
|
356 <a name="l00346"></a>00346 <span class="comment">/* Macintosh character set */</span> |
|
357 <a name="l00347"></a>00347 usCharSet = usMacRoman; |
|
358 <a name="l00348"></a>00348 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (iWordVersion == 0) { |
|
359 <a name="l00349"></a>00349 <span class="comment">/* DOS character set */</span> |
|
360 <a name="l00350"></a>00350 usCharSet = usCp850; |
|
361 <a name="l00351"></a>00351 } <span class="keywordflow">else</span> { |
|
362 <a name="l00352"></a>00352 <span class="comment">/* Windows character set */</span> |
|
363 <a name="l00353"></a>00353 <span class="keywordflow">switch</span> (eEncoding) { |
|
364 <a name="l00354"></a>00354 <span class="keywordflow">case</span> encoding_latin_2: |
|
365 <a name="l00355"></a>00355 usCharSet = usCp1250; |
|
366 <a name="l00356"></a>00356 <span class="keywordflow">break</span>; |
|
367 <a name="l00357"></a>00357 <span class="keywordflow">case</span> encoding_cyrillic: |
|
368 <a name="l00358"></a>00358 usCharSet = usCp1251; |
|
369 <a name="l00359"></a>00359 <span class="keywordflow">break</span>; |
|
370 <a name="l00360"></a>00360 <span class="keywordflow">case</span> encoding_latin_1: |
|
371 <a name="l00361"></a>00361 <span class="keywordflow">default</span>: |
|
372 <a name="l00362"></a>00362 usCharSet = usCp1252; |
|
373 <a name="l00363"></a>00363 <span class="keywordflow">break</span>; |
|
374 <a name="l00364"></a>00364 } |
|
375 <a name="l00365"></a>00365 } |
|
376 <a name="l00366"></a>00366 fail(usCharSet == NULL); |
|
377 <a name="l00367"></a>00367 <span class="keywordflow">if</span> (usChar &gt;= 0x80 &amp;&amp; usChar &lt;= 0x9f) { |
|
378 <a name="l00368"></a>00368 <span class="comment">/* Translate implementation defined characters */</span> |
|
379 <a name="l00369"></a>00369 usChar = usCharSet[usChar - 0x80]; |
|
380 <a name="l00370"></a>00370 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (iWordVersion &lt; 8 &amp;&amp; usChar &gt;= 0xa0 &amp;&amp; usChar &lt;= 0xff) { |
|
381 <a name="l00371"></a>00371 <span class="comment">/* Translate old character set to Unicode */</span> |
|
382 <a name="l00372"></a>00372 usChar = usCharSet[usChar - 0x80]; |
|
383 <a name="l00373"></a>00373 } |
|
384 <a name="l00374"></a>00374 |
|
385 <a name="l00375"></a>00375 <span class="comment">/* Microsoft Unicode to real Unicode */</span> |
|
386 <a name="l00376"></a>00376 <span class="keywordflow">if</span> (usChar >= 0xf020 && usChar <= 0xf0ff) { |
|
387 <a name="l00377"></a>00377 DBG_HEX_C(usPrivateArea[usChar - 0xf020] == 0x003f, usChar); |
|
388 <a name="l00378"></a>00378 usChar = usPrivateArea[usChar - 0xf020]; |
|
389 <a name="l00379"></a>00379 } |
|
390 <a name="l00380"></a>00380 |
|
391 <a name="l00381"></a>00381 <span class="comment">/* Characters with a special meaning in Word */</span> |
|
392 <a name="l00382"></a>00382 <span class="keywordflow">switch</span> (usChar) { |
|
393 <a name="l00383"></a>00383 <span class="keywordflow">case</span> IGNORE_CHARACTER: |
|
394 <a name="l00384"></a>00384 <span class="keywordflow">case</span> FOOTNOTE_SEPARATOR: |
|
395 <a name="l00385"></a>00385 <span class="keywordflow">case</span> FOOTNOTE_CONTINUATION: |
|
396 <a name="l00386"></a>00386 <span class="keywordflow">case</span> ANNOTATION: |
|
397 <a name="l00387"></a>00387 <span class="keywordflow">case</span> FRAME: |
|
398 <a name="l00388"></a>00388 <span class="keywordflow">case</span> LINE_FEED: |
|
399 <a name="l00389"></a>00389 <span class="keywordflow">case</span> WORD_SOFT_HYPHEN: |
|
400 <a name="l00390"></a>00390 <span class="keywordflow">case</span> UNICODE_HYPHENATION_POINT: |
|
401 <a name="l00391"></a>00391 <span class="keywordflow">return</span> IGNORE_CHARACTER; |
|
402 <a name="l00392"></a>00392 <span class="keywordflow">case</span> PICTURE: |
|
403 <a name="l00393"></a>00393 <span class="keywordflow">case</span> TABLE_SEPARATOR: |
|
404 <a name="l00394"></a>00394 <span class="keywordflow">case</span> TAB: |
|
405 <a name="l00395"></a>00395 <span class="keywordflow">case</span> HARD_RETURN: |
|
406 <a name="l00396"></a>00396 <span class="keywordflow">case</span> PAGE_BREAK: |
|
407 <a name="l00397"></a>00397 <span class="keywordflow">case</span> PAR_END: |
|
408 <a name="l00398"></a>00398 <span class="keywordflow">case</span> COLUMN_FEED: |
|
409 <a name="l00399"></a>00399 <span class="keywordflow">return</span> (ULONG)usChar; |
|
410 <a name="l00400"></a>00400 <span class="keywordflow">case</span> FOOTNOTE_OR_ENDNOTE: |
|
411 <a name="l00401"></a>00401 NO_DBG_HEX(ulFileOffset); |
|
412 <a name="l00402"></a>00402 <span class="keywordflow">switch</span> (eGetNotetype(ulFileOffset)) { |
|
413 <a name="l00403"></a>00403 <span class="keywordflow">case</span> notetype_is_footnote: |
|
414 <a name="l00404"></a>00404 <span class="keywordflow">return</span> FOOTNOTE_CHAR; |
|
415 <a name="l00405"></a>00405 <span class="keywordflow">case</span> notetype_is_endnote: |
|
416 <a name="l00406"></a>00406 <span class="keywordflow">return</span> ENDNOTE_CHAR; |
|
417 <a name="l00407"></a>00407 <span class="keywordflow">default</span>: |
|
418 <a name="l00408"></a>00408 <span class="keywordflow">return</span> UNKNOWN_NOTE_CHAR; |
|
419 <a name="l00409"></a>00409 } |
|
420 <a name="l00410"></a>00410 <span class="keywordflow">case</span> WORD_UNBREAKABLE_JOIN: |
|
421 <a name="l00411"></a>00411 <span class="keywordflow">return</span> (ULONG)OUR_UNBREAKABLE_JOIN; |
|
422 <a name="l00412"></a>00412 <span class="keywordflow">default</span>: |
|
423 <a name="l00413"></a>00413 <span class="keywordflow">break</span>; |
|
424 <a name="l00414"></a>00414 } |
|
425 <a name="l00415"></a>00415 |
|
426 <a name="l00416"></a>00416 <span class="keywordflow">if</span> (eEncoding != encoding_utf_8) { |
|
427 <a name="l00417"></a>00417 <span class="comment">/* Latin characters in an oriental text */</span> |
|
428 <a name="l00418"></a>00418 <span class="keywordflow">if</span> (usChar >= 0xff01 && usChar <= 0xff5e) { |
|
429 <a name="l00419"></a>00419 usChar -= 0xfee0; |
|
430 <a name="l00420"></a>00420 } |
|
431 <a name="l00421"></a>00421 } |
|
432 <a name="l00422"></a>00422 |
|
433 <a name="l00423"></a>00423 <span class="keywordflow">if</span> (eEncoding == encoding_latin_1 && |
|
434 <a name="l00424"></a>00424 (eConversionType == conversion_ps || |
|
435 <a name="l00425"></a>00425 eConversionType == conversion_pdf)) { |
|
436 <a name="l00426"></a>00426 <span class="comment">/* Ugly, but it makes the PostScript and PDF look better */</span> |
|
437 <a name="l00427"></a>00427 <span class="keywordflow">switch</span> (usChar) { |
|
438 <a name="l00428"></a>00428 <span class="keywordflow">case</span> UNICODE_ELLIPSIS: |
|
439 <a name="l00429"></a>00429 <span class="keywordflow">return</span> 140; |
|
440 <a name="l00430"></a>00430 <span class="keywordflow">case</span> UNICODE_TRADEMARK_SIGN: |
|
441 <a name="l00431"></a>00431 <span class="keywordflow">return</span> 141; |
|
442 <a name="l00432"></a>00432 <span class="keywordflow">case</span> UNICODE_PER_MILLE_SIGN: |
|
443 <a name="l00433"></a>00433 <span class="keywordflow">return</span> 142; |
|
444 <a name="l00434"></a>00434 <span class="keywordflow">case</span> UNICODE_BULLET: |
|
445 <a name="l00435"></a>00435 <span class="keywordflow">case</span> UNICODE_BULLET_OPERATOR: |
|
446 <a name="l00436"></a>00436 <span class="keywordflow">case</span> UNICODE_BLACK_CLUB_SUIT: |
|
447 <a name="l00437"></a>00437 <span class="keywordflow">return</span> 143; |
|
448 <a name="l00438"></a>00438 <span class="keywordflow">case</span> UNICODE_LEFT_SINGLE_QMARK: |
|
449 <a name="l00439"></a>00439 <span class="keywordflow">return</span> 144; |
|
450 <a name="l00440"></a>00440 <span class="keywordflow">case</span> UNICODE_RIGHT_SINGLE_QMARK: |
|
451 <a name="l00441"></a>00441 <span class="keywordflow">return</span> 145; |
|
452 <a name="l00442"></a>00442 <span class="keywordflow">case</span> UNICODE_SINGLE_LEFT_ANGLE_QMARK: |
|
453 <a name="l00443"></a>00443 <span class="keywordflow">return</span> 146; |
|
454 <a name="l00444"></a>00444 <span class="keywordflow">case</span> UNICODE_SINGLE_RIGHT_ANGLE_QMARK: |
|
455 <a name="l00445"></a>00445 <span class="keywordflow">return</span> 147; |
|
456 <a name="l00446"></a>00446 <span class="keywordflow">case</span> UNICODE_LEFT_DOUBLE_QMARK: |
|
457 <a name="l00447"></a>00447 <span class="keywordflow">return</span> 148; |
|
458 <a name="l00448"></a>00448 <span class="keywordflow">case</span> UNICODE_RIGHT_DOUBLE_QMARK: |
|
459 <a name="l00449"></a>00449 <span class="keywordflow">return</span> 149; |
|
460 <a name="l00450"></a>00450 <span class="keywordflow">case</span> UNICODE_DOUBLE_LOW_9_QMARK: |
|
461 <a name="l00451"></a>00451 <span class="keywordflow">return</span> 150; |
|
462 <a name="l00452"></a>00452 <span class="keywordflow">case</span> UNICODE_EN_DASH: |
|
463 <a name="l00453"></a>00453 <span class="keywordflow">return</span> 151; |
|
464 <a name="l00454"></a>00454 <span class="keywordflow">case</span> UNICODE_EM_DASH: |
|
465 <a name="l00455"></a>00455 <span class="keywordflow">return</span> 152; |
|
466 <a name="l00456"></a>00456 <span class="keywordflow">case</span> UNICODE_MINUS_SIGN: |
|
467 <a name="l00457"></a>00457 <span class="keywordflow">return</span> 153; |
|
468 <a name="l00458"></a>00458 <span class="keywordflow">case</span> UNICODE_CAPITAL_LIGATURE_OE: |
|
469 <a name="l00459"></a>00459 <span class="keywordflow">return</span> 154; |
|
470 <a name="l00460"></a>00460 <span class="keywordflow">case</span> UNICODE_SMALL_LIGATURE_OE: |
|
471 <a name="l00461"></a>00461 <span class="keywordflow">return</span> 155; |
|
472 <a name="l00462"></a>00462 <span class="keywordflow">case</span> UNICODE_DAGGER: |
|
473 <a name="l00463"></a>00463 <span class="keywordflow">return</span> 156; |
|
474 <a name="l00464"></a>00464 <span class="keywordflow">case</span> UNICODE_DOUBLE_DAGGER: |
|
475 <a name="l00465"></a>00465 <span class="keywordflow">return</span> 157; |
|
476 <a name="l00466"></a>00466 <span class="keywordflow">case</span> UNICODE_SMALL_LIGATURE_FI: |
|
477 <a name="l00467"></a>00467 <span class="keywordflow">return</span> 158; |
|
478 <a name="l00468"></a>00468 <span class="keywordflow">case</span> UNICODE_SMALL_LIGATURE_FL: |
|
479 <a name="l00469"></a>00469 <span class="keywordflow">return</span> 159; |
|
480 <a name="l00470"></a>00470 <span class="keywordflow">default</span>: |
|
481 <a name="l00471"></a>00471 <span class="keywordflow">break</span>; |
|
482 <a name="l00472"></a>00472 } |
|
483 <a name="l00473"></a>00473 } |
|
484 <a name="l00474"></a>00474 |
|
485 <a name="l00475"></a>00475 <span class="keywordflow">if</span> (eConversionType == conversion_pdf) { |
|
486 <a name="l00476"></a>00476 <span class="keywordflow">if</span> (eEncoding == encoding_latin_1) { |
|
487 <a name="l00477"></a>00477 <span class="keywordflow">switch</span> (usChar) { |
|
488 <a name="l00478"></a>00478 <span class="keywordflow">case</span> UNICODE_EURO_SIGN: |
|
489 <a name="l00479"></a>00479 <span class="keywordflow">return</span> 128; |
|
490 <a name="l00480"></a>00480 <span class="keywordflow">default</span>: |
|
491 <a name="l00481"></a>00481 <span class="keywordflow">break</span>; |
|
492 <a name="l00482"></a>00482 } |
|
493 <a name="l00483"></a>00483 } <span class="keywordflow">else</span> <span class="keywordflow">if</span> (eEncoding == encoding_latin_2) { |
|
494 <a name="l00484"></a>00484 <span class="keywordflow">switch</span> (usChar) { |
|
495 <a name="l00485"></a>00485 <span class="keywordflow">case</span> UNICODE_CAPITAL_D_WITH_STROKE: |
|
496 <a name="l00486"></a>00486 <span class="keywordflow">case</span> UNICODE_SMALL_D_WITH_STROKE: |
|
497 <a name="l00487"></a>00487 <span class="keywordflow">return</span> 0x3f; |
|
498 <a name="l00488"></a>00488 <span class="keywordflow">default</span>: |
|
499 <a name="l00489"></a>00489 <span class="keywordflow">break</span>; |
|
500 <a name="l00490"></a>00490 } |
|
501 <a name="l00491"></a>00491 } |
|
502 <a name="l00492"></a>00492 } |
|
503 <a name="l00493"></a>00493 |
|
504 <a name="l00494"></a>00494 <span class="keywordflow">if</span> (usChar < 0x80) { |
|
505 <a name="l00495"></a>00495 <span class="comment">/* US ASCII */</span> |
|
506 <a name="l00496"></a>00496 <span class="keywordflow">if</span> (usChar < 0x20 || usChar == 0x7f) { |
|
507 <a name="l00497"></a>00497 <span class="comment">/* Ignore control characters */</span> |
|
508 <a name="l00498"></a>00498 DBG_HEX(usChar); |
|
509 <a name="l00499"></a>00499 DBG_FIXME(); |
|
510 <a name="l00500"></a>00500 <span class="keywordflow">return</span> IGNORE_CHARACTER; |
|
511 <a name="l00501"></a>00501 } |
|
512 <a name="l00502"></a>00502 <span class="keywordflow">return</span> (ULONG)usChar; |
|
513 <a name="l00503"></a>00503 } |
|
514 <a name="l00504"></a>00504 |
|
515 <a name="l00505"></a>00505 <span class="keywordflow">if</span> (eEncoding == encoding_utf_8) { |
|
516 <a name="l00506"></a>00506 <span class="comment">/* No need to convert Unicode characters */</span> |
|
517 <a name="l00507"></a>00507 <span class="keywordflow">return</span> (ULONG)usChar; |
|
518 <a name="l00508"></a>00508 } |
|
519 <a name="l00509"></a>00509 |
|
520 <a name="l00510"></a>00510 <span class="comment">/* Unicode to local representation */</span> |
|
521 <a name="l00511"></a>00511 pTmp = pGetCharTableRecord(usChar); |
|
522 <a name="l00512"></a>00512 <span class="keywordflow">if</span> (pTmp != NULL) { |
|
523 <a name="l00513"></a>00513 DBG_HEX_C(usChar >= 0x7f && usChar <= 0x9f, usChar); |
|
524 <a name="l00514"></a>00514 <span class="keywordflow">return</span> (ULONG)pTmp->ucLocal; |
|
525 <a name="l00515"></a>00515 } |
|
526 <a name="l00516"></a>00516 |
|
527 <a name="l00517"></a>00517 <span class="comment">/* Fancy characters to simple US ASCII */</span> |
|
528 <a name="l00518"></a>00518 <span class="keywordflow">switch</span> (usChar) { |
|
529 <a name="l00519"></a>00519 <span class="keywordflow">case</span> UNICODE_SMALL_F_HOOK: |
|
530 <a name="l00520"></a>00520 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'f'</span>; |
|
531 <a name="l00521"></a>00521 <span class="keywordflow">case</span> UNICODE_GREEK_CAPITAL_CHI: |
|
532 <a name="l00522"></a>00522 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'X'</span>; |
|
533 <a name="l00523"></a>00523 <span class="keywordflow">case</span> UNICODE_GREEK_SMALL_UPSILON: |
|
534 <a name="l00524"></a>00524 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'v'</span>; |
|
535 <a name="l00525"></a>00525 <span class="keywordflow">case</span> UNICODE_MODIFIER_CIRCUMFLEX: |
|
536 <a name="l00526"></a>00526 <span class="keywordflow">case</span> UNICODE_UPWARDS_ARROW: |
|
537 <a name="l00527"></a>00527 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'^'</span>; |
|
538 <a name="l00528"></a>00528 <span class="keywordflow">case</span> UNICODE_SMALL_TILDE: |
|
539 <a name="l00529"></a>00529 <span class="keywordflow">case</span> UNICODE_TILDE_OPERATOR: |
|
540 <a name="l00530"></a>00530 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'~'</span>; |
|
541 <a name="l00531"></a>00531 <span class="keywordflow">case</span> UNICODE_EN_QUAD: |
|
542 <a name="l00532"></a>00532 <span class="keywordflow">case</span> UNICODE_EM_QUAD: |
|
543 <a name="l00533"></a>00533 <span class="keywordflow">case</span> UNICODE_EN_SPACE: |
|
544 <a name="l00534"></a>00534 <span class="keywordflow">case</span> UNICODE_EM_SPACE: |
|
545 <a name="l00535"></a>00535 <span class="keywordflow">case</span> UNICODE_THREE_PER_EM_SPACE: |
|
546 <a name="l00536"></a>00536 <span class="keywordflow">case</span> UNICODE_FOUR_PER_EM_SPACE: |
|
547 <a name="l00537"></a>00537 <span class="keywordflow">case</span> UNICODE_SIX_PER_EM_SPACE: |
|
548 <a name="l00538"></a>00538 <span class="keywordflow">case</span> UNICODE_FIGURE_SPACE: |
|
549 <a name="l00539"></a>00539 <span class="keywordflow">case</span> UNICODE_PUNCTUATION_SPACE: |
|
550 <a name="l00540"></a>00540 <span class="keywordflow">case</span> UNICODE_THIN_SPACE: |
|
551 <a name="l00541"></a>00541 <span class="keywordflow">case</span> UNICODE_NARROW_NO_BREAK_SPACE: |
|
552 <a name="l00542"></a>00542 <span class="keywordflow">case</span> UNICODE_LIGHT_SHADE: |
|
553 <a name="l00543"></a>00543 <span class="keywordflow">case</span> UNICODE_MEDIUM_SHADE: |
|
554 <a name="l00544"></a>00544 <span class="keywordflow">case</span> UNICODE_DARK_SHADE: |
|
555 <a name="l00545"></a>00545 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">' '</span>; |
|
556 <a name="l00546"></a>00546 <span class="keywordflow">case</span> UNICODE_LEFT_DOUBLE_QMARK: |
|
557 <a name="l00547"></a>00547 <span class="keywordflow">case</span> UNICODE_RIGHT_DOUBLE_QMARK: |
|
558 <a name="l00548"></a>00548 <span class="keywordflow">case</span> UNICODE_DOUBLE_LOW_9_QMARK: |
|
559 <a name="l00549"></a>00549 <span class="keywordflow">case</span> UNICODE_DOUBLE_HIGH_REV_9_QMARK: |
|
560 <a name="l00550"></a>00550 <span class="keywordflow">case</span> UNICODE_DOUBLE_PRIME: |
|
561 <a name="l00551"></a>00551 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'"'</span>; |
|
562 <a name="l00552"></a>00552 <span class="keywordflow">case</span> UNICODE_LEFT_SINGLE_QMARK: |
|
563 <a name="l00553"></a>00553 <span class="keywordflow">case</span> UNICODE_RIGHT_SINGLE_QMARK: |
|
564 <a name="l00554"></a>00554 <span class="keywordflow">case</span> UNICODE_SINGLE_LOW_9_QMARK: |
|
565 <a name="l00555"></a>00555 <span class="keywordflow">case</span> UNICODE_SINGLE_HIGH_REV_9_QMARK: |
|
566 <a name="l00556"></a>00556 <span class="keywordflow">case</span> UNICODE_PRIME: |
|
567 <a name="l00557"></a>00557 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'\''</span>; |
|
568 <a name="l00558"></a>00558 <span class="keywordflow">case</span> UNICODE_HYPHEN: |
|
569 <a name="l00559"></a>00559 <span class="keywordflow">case</span> UNICODE_NON_BREAKING_HYPHEN: |
|
570 <a name="l00560"></a>00560 <span class="keywordflow">case</span> UNICODE_FIGURE_DASH: |
|
571 <a name="l00561"></a>00561 <span class="keywordflow">case</span> UNICODE_EN_DASH: |
|
572 <a name="l00562"></a>00562 <span class="keywordflow">case</span> UNICODE_EM_DASH: |
|
573 <a name="l00563"></a>00563 <span class="keywordflow">case</span> UNICODE_HORIZONTAL_BAR: |
|
574 <a name="l00564"></a>00564 <span class="keywordflow">case</span> UNICODE_MINUS_SIGN: |
|
575 <a name="l00565"></a>00565 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_HORIZONTAL: |
|
576 <a name="l00566"></a>00566 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_HORIZONTAL: |
|
577 <a name="l00567"></a>00567 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'-'</span>; |
|
578 <a name="l00568"></a>00568 <span class="keywordflow">case</span> UNICODE_DOUBLE_VERTICAL_LINE: |
|
579 <a name="l00569"></a>00569 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_VERTICAL: |
|
580 <a name="l00570"></a>00570 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_VERTICAL: |
|
581 <a name="l00571"></a>00571 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'|'</span>; |
|
582 <a name="l00572"></a>00572 <span class="keywordflow">case</span> UNICODE_DOUBLE_LOW_LINE: |
|
583 <a name="l00573"></a>00573 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'_'</span>; |
|
584 <a name="l00574"></a>00574 <span class="keywordflow">case</span> UNICODE_DAGGER: |
|
585 <a name="l00575"></a>00575 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'+'</span>; |
|
586 <a name="l00576"></a>00576 <span class="keywordflow">case</span> UNICODE_DOUBLE_DAGGER: |
|
587 <a name="l00577"></a>00577 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'#'</span>; |
|
588 <a name="l00578"></a>00578 <span class="keywordflow">case</span> UNICODE_BULLET: |
|
589 <a name="l00579"></a>00579 <span class="keywordflow">case</span> UNICODE_BULLET_OPERATOR: |
|
590 <a name="l00580"></a>00580 <span class="keywordflow">case</span> UNICODE_BLACK_CLUB_SUIT: |
|
591 <a name="l00581"></a>00581 <span class="keywordflow">return</span> (ULONG)ucGetBulletCharacter(eConversionType, eEncoding); |
|
592 <a name="l00582"></a>00582 <span class="keywordflow">case</span> UNICODE_ONE_DOT_LEADER: |
|
593 <a name="l00583"></a>00583 <span class="keywordflow">case</span> UNICODE_TWO_DOT_LEADER: |
|
594 <a name="l00584"></a>00584 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'.'</span>; |
|
595 <a name="l00585"></a>00585 <span class="keywordflow">case</span> UNICODE_ELLIPSIS: |
|
596 <a name="l00586"></a>00586 <span class="preprocessor">#if defined(__riscos)</span> |
|
597 <a name="l00587"></a>00587 <span class="preprocessor"></span> <span class="keywordflow">return</span> (ULONG)OUR_ELLIPSIS; |
|
598 <a name="l00588"></a>00588 <span class="preprocessor">#else</span> |
|
599 <a name="l00589"></a>00589 <span class="preprocessor"></span> <span class="keywordflow">if</span> (ulFileOffset == 0) { |
|
600 <a name="l00590"></a>00590 <span class="keywordflow">return</span> (ULONG)OUR_ELLIPSIS; |
|
601 <a name="l00591"></a>00591 } |
|
602 <a name="l00592"></a>00592 <span class="keywordflow">return</span> UNICODE_ELLIPSIS; |
|
603 <a name="l00593"></a>00593 <span class="preprocessor">#endif </span><span class="comment">/* __riscos */</span> |
|
604 <a name="l00594"></a>00594 <span class="keywordflow">case</span> UNICODE_DOUBLE_LEFT_ANGLE_QMARK: |
|
605 <a name="l00595"></a>00595 <span class="keywordflow">case</span> UNICODE_TRIANGULAR_BULLET: |
|
606 <a name="l00596"></a>00596 <span class="keywordflow">case</span> UNICODE_SINGLE_LEFT_ANGLE_QMARK: |
|
607 <a name="l00597"></a>00597 <span class="keywordflow">case</span> UNICODE_LEFTWARDS_ARROW: |
|
608 <a name="l00598"></a>00598 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'<'</span>; |
|
609 <a name="l00599"></a>00599 <span class="keywordflow">case</span> UNICODE_DOUBLE_RIGHT_ANGLE_QMARK: |
|
610 <a name="l00600"></a>00600 <span class="keywordflow">case</span> UNICODE_SINGLE_RIGHT_ANGLE_QMARK: |
|
611 <a name="l00601"></a>00601 <span class="keywordflow">case</span> UNICODE_RIGHTWARDS_ARROW: |
|
612 <a name="l00602"></a>00602 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'>'</span>; |
|
613 <a name="l00603"></a>00603 <span class="keywordflow">case</span> UNICODE_UNDERTIE: |
|
614 <a name="l00604"></a>00604 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'-'</span>; |
|
615 <a name="l00605"></a>00605 <span class="keywordflow">case</span> UNICODE_N_ARY_SUMMATION: |
|
616 <a name="l00606"></a>00606 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'S'</span>; |
|
617 <a name="l00607"></a>00607 <span class="keywordflow">case</span> UNICODE_EURO_SIGN: |
|
618 <a name="l00608"></a>00608 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'E'</span>; |
|
619 <a name="l00609"></a>00609 <span class="keywordflow">case</span> UNICODE_CIRCLE: |
|
620 <a name="l00610"></a>00610 <span class="keywordflow">case</span> UNICODE_SQUARE: |
|
621 <a name="l00611"></a>00611 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'O'</span>; |
|
622 <a name="l00612"></a>00612 <span class="keywordflow">case</span> UNICODE_DIAMOND: |
|
623 <a name="l00613"></a>00613 <span class="keywordflow">return</span> (ULONG)OUR_DIAMOND; |
|
624 <a name="l00614"></a>00614 <span class="keywordflow">case</span> UNICODE_NUMERO_SIGN: |
|
625 <a name="l00615"></a>00615 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'N'</span>; |
|
626 <a name="l00616"></a>00616 <span class="keywordflow">case</span> UNICODE_KELVIN_SIGN: |
|
627 <a name="l00617"></a>00617 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'K'</span>; |
|
628 <a name="l00618"></a>00618 <span class="keywordflow">case</span> UNICODE_DOWNWARDS_ARROW: |
|
629 <a name="l00619"></a>00619 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'v'</span>; |
|
630 <a name="l00620"></a>00620 <span class="keywordflow">case</span> UNICODE_FRACTION_SLASH: |
|
631 <a name="l00621"></a>00621 <span class="keywordflow">case</span> UNICODE_DIVISION_SLASH: |
|
632 <a name="l00622"></a>00622 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'/'</span>; |
|
633 <a name="l00623"></a>00623 <span class="keywordflow">case</span> UNICODE_ASTERISK_OPERATOR: |
|
634 <a name="l00624"></a>00624 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'*'</span>; |
|
635 <a name="l00625"></a>00625 <span class="keywordflow">case</span> UNICODE_RATIO: |
|
636 <a name="l00626"></a>00626 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">':'</span>; |
|
637 <a name="l00627"></a>00627 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_DOWN_RIGHT: |
|
638 <a name="l00628"></a>00628 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_DOWN_AND_LEFT: |
|
639 <a name="l00629"></a>00629 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_UP_AND_RIGHT: |
|
640 <a name="l00630"></a>00630 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_UP_AND_LEFT: |
|
641 <a name="l00631"></a>00631 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_VERTICAL_AND_RIGHT: |
|
642 <a name="l00632"></a>00632 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_VERTICAL_AND_LEFT: |
|
643 <a name="l00633"></a>00633 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_DOWN_AND_HORIZONTAL: |
|
644 <a name="l00634"></a>00634 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_UP_AND_HORIZONTAL: |
|
645 <a name="l00635"></a>00635 <span class="keywordflow">case</span> UNICODE_BD_LIGHT_VERTICAL_AND_HORIZONTAL: |
|
646 <a name="l00636"></a>00636 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_DOWN_AND_RIGHT: |
|
647 <a name="l00637"></a>00637 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_DOWN_AND_LEFT: |
|
648 <a name="l00638"></a>00638 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_UP_AND_RIGHT: |
|
649 <a name="l00639"></a>00639 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_UP_AND_LEFT: |
|
650 <a name="l00640"></a>00640 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_VERTICAL_AND_RIGHT: |
|
651 <a name="l00641"></a>00641 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_VERTICAL_AND_LEFT: |
|
652 <a name="l00642"></a>00642 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_DOWN_AND_HORIZONTAL: |
|
653 <a name="l00643"></a>00643 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_UP_AND_HORIZONTAL: |
|
654 <a name="l00644"></a>00644 <span class="keywordflow">case</span> UNICODE_BD_DOUBLE_VERTICAL_AND_HORIZONTAL: |
|
655 <a name="l00645"></a>00645 <span class="keywordflow">case</span> UNICODE_BLACK_SQUARE: |
|
656 <a name="l00646"></a>00646 <span class="keywordflow">return</span> (ULONG)<span class="charliteral">'+'</span>; |
|
657 <a name="l00647"></a>00647 <span class="keywordflow">case</span> UNICODE_HAIR_SPACE: |
|
658 <a name="l00648"></a>00648 <span class="keywordflow">case</span> UNICODE_ZERO_WIDTH_SPACE: |
|
659 <a name="l00649"></a>00649 <span class="keywordflow">case</span> UNICODE_ZERO_WIDTH_NON_JOINER: |
|
660 <a name="l00650"></a>00650 <span class="keywordflow">case</span> UNICODE_ZERO_WIDTH_JOINER: |
|
661 <a name="l00651"></a>00651 <span class="keywordflow">case</span> UNICODE_LEFT_TO_RIGHT_MARK: |
|
662 <a name="l00652"></a>00652 <span class="keywordflow">case</span> UNICODE_RIGHT_TO_LEFT_MARK: |
|
663 <a name="l00653"></a>00653 <span class="keywordflow">case</span> UNICODE_LEFT_TO_RIGHT_EMBEDDING: |
|
664 <a name="l00654"></a>00654 <span class="keywordflow">case</span> UNICODE_RIGHT_TO_LEFT_EMBEDDING: |
|
665 <a name="l00655"></a>00655 <span class="keywordflow">case</span> UNICODE_POP_DIRECTIONAL_FORMATTING: |
|
666 <a name="l00656"></a>00656 <span class="keywordflow">case</span> UNICODE_LEFT_TO_RIGHT_OVERRIDE: |
|
667 <a name="l00657"></a>00657 <span class="keywordflow">case</span> UNICODE_RIGHT_TO_LEFT_OVERRIDE: |
|
668 <a name="l00658"></a>00658 <span class="keywordflow">case</span> UNICODE_ZERO_WIDTH_NO_BREAK_SPACE: |
|
669 <a name="l00659"></a>00659 <span class="keywordflow">return</span> IGNORE_CHARACTER; |
|
670 <a name="l00660"></a>00660 <span class="keywordflow">default</span>: |
|
671 <a name="l00661"></a>00661 <span class="keywordflow">break</span>; |
|
672 <a name="l00662"></a>00662 } |
|
673 <a name="l00663"></a>00663 |
|
674 <a name="l00664"></a>00664 <span class="keywordflow">if</span> (usChar == UNICODE_TRADEMARK_SIGN) { |
|
675 <a name="l00665"></a>00665 <span class="comment">/*</span> |
|
676 <a name="l00666"></a>00666 <span class="comment"> * No local representation, it doesn't look like anything in</span> |
|
677 <a name="l00667"></a>00667 <span class="comment"> * US-ASCII and a question mark does more harm than good.</span> |
|
678 <a name="l00668"></a>00668 <span class="comment"> */</span> |
|
679 <a name="l00669"></a>00669 <span class="keywordflow">return</span> IGNORE_CHARACTER; |
|
680 <a name="l00670"></a>00670 } |
|
681 <a name="l00671"></a>00671 |
|
682 <a name="l00672"></a>00672 <span class="keywordflow">if</span> (usChar >= 0xa0 && usChar <= 0xff) { |
|
683 <a name="l00673"></a>00673 <span class="comment">/* Before Word 97, Word didn't use Unicode */</span> |
|
684 <a name="l00674"></a>00674 <span class="keywordflow">return</span> (ULONG)usChar; |
|
685 <a name="l00675"></a>00675 } |
|
686 <a name="l00676"></a>00676 |
|
687 <a name="l00677"></a>00677 DBG_HEX_C(usChar < 0x3000 || usChar >= 0xd800, ulFileOffset); |
|
688 <a name="l00678"></a>00678 DBG_HEX_C(usChar < 0x3000 || usChar >= 0xd800, usChar); |
|
689 <a name="l00679"></a>00679 DBG_MSG_C(usChar >= 0xe000 && usChar < 0xf900, <span class="stringliteral">"Private Use Area"</span>); |
|
690 <a name="l00680"></a>00680 |
|
691 <a name="l00681"></a>00681 <span class="comment">/* Untranslated Unicode character */</span> |
|
692 <a name="l00682"></a>00682 <span class="keywordflow">return</span> 0x3f; |
|
693 <a name="l00683"></a>00683 } <span class="comment">/* end of ulTranslateCharacters */</span> |
|
694 <a name="l00684"></a>00684 |
|
695 <a name="l00685"></a>00685 <span class="comment">/*</span> |
|
696 <a name="l00686"></a>00686 <span class="comment"> * ulToUpper - convert letter to upper case</span> |
|
697 <a name="l00687"></a>00687 <span class="comment"> *</span> |
|
698 <a name="l00688"></a>00688 <span class="comment"> * This function converts a letter to upper case. Characters below 0x100 are</span> |
|
699 <a name="l00689"></a>00689 <span class="comment"> * handled without toupper(3), so their result is independent from the</span> |
|
700 <a name="l00690"></a>00690 <span class="comment"> * settings of locale. This comes in handy for Word documents that are</span> |
|
701 <a name="l00691"></a>00691 <span class="comment"> * written in, or that contain, more than one language.</span> |
|
702 <a name="l00692"></a>00692 <span class="comment"> *</span> |
|
703 <a name="l00693"></a>00693 <span class="comment"> * returns the converted letter, or ulChar if the conversion was not possible.</span> |
|
704 <a name="l00694"></a>00694 <span class="comment"> */</span> |
|
705 <a name="l00695"></a>00695 ULONG |
|
706 <a name="l00696"></a>00696 ulToUpper(ULONG ulChar) |
|
707 <a name="l00697"></a>00697 { |
|
708 <a name="l00698"></a>00698 <span class="keywordflow">if</span> (ulChar < 0x80) { |
|
709 <a name="l00699"></a>00699 <span class="comment">/* US ASCII: map a-z (0x61-0x7a) by hand; toupper(3) follows LC_CTYPE */</span> |
|
710 <a name="l00700"></a>00700 <span class="keywordflow">return</span> (ulChar >= 0x61 && ulChar <= 0x7a) ? ulChar - 0x20 : ulChar; |
|
711 <a name="l00701"></a>00701 } |
|
712 <a name="l00702"></a>00702 <span class="keywordflow">if</span> (ulChar >= 0xe0 && ulChar <= 0xfe && ulChar != 0xf7) { |
|
713 <a name="l00703"></a>00703 <span class="comment">/*</span> |
|
714 <a name="l00704"></a>00704 <span class="comment"> * Lower case accented characters: clearing bit 0x20 gives the capital</span> |
|
715 <a name="l00705"></a>00705 <span class="comment"> * 0xf7 is Division sign; 0xd7 is Multiplication sign</span> |
|
716 <a name="l00706"></a>00706 <span class="comment"> * 0xff is y with diaeresis; 0xdf is Sharp s</span> |
|
717 <a name="l00707"></a>00707 <span class="comment"> */</span> |
|
718 <a name="l00708"></a>00708 <span class="keywordflow">return</span> ulChar & ~0x20; |
|
719 <a name="l00709"></a>00709 } |
|
720 <a name="l00710"></a>00710 <span class="preprocessor">#if defined(__STDC_ISO_10646__)</span> |
|
721 <a name="l00711"></a>00711 <span class="preprocessor"></span> <span class="comment">/*</span> |
|
722 <a name="l00712"></a>00712 <span class="comment"> * If this is ISO C99 and all locales have wchar_t = ISO 10646</span> |
|
723 <a name="l00713"></a>00713 <span class="comment"> * (e.g., glibc 2.2 or newer), then use standard function</span> |
|
724 <a name="l00714"></a>00714 <span class="comment"> */</span> |
|
725 <a name="l00715"></a>00715 <span class="keywordflow">if</span> (ulChar > 0xff) { |
|
726 <a name="l00716"></a>00716 <span class="keywordflow">return</span> (ULONG)towupper((wint_t)ulChar); |
|
727 <a name="l00717"></a>00717 } |
|
728 <a name="l00718"></a>00718 <span class="preprocessor">#endif </span><span class="comment">/* __STDC_ISO_10646__ */</span> |
|
729 <a name="l00719"></a>00719 <span class="keywordflow">return</span> ulChar; |
|
730 <a name="l00720"></a>00720 } <span class="comment">/* end of ulToUpper */</span> |
|
731 </pre></div></div> |
|
732 <hr size="1"/><address style="text-align: right;"><small>Generated by |
|
733 <a href="http://www.doxygen.org/index.html"> |
|
734 <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.6.2 </small></address> |
|
735 </body> |
|
736 </html> |
|