1 <!DOCTYPE html PUBLIC "-//W3C//DTD XHTML 1.0 Transitional//EN" "http://www.w3.org/TR/xhtml1/DTD/xhtml1-transitional.dtd"> |
|
2 <html xmlns="http://www.w3.org/1999/xhtml"> |
|
3 <head> |
|
4 <meta http-equiv="Content-Type" content="text/html;charset=UTF-8"/> |
|
5 <title>TB9.2 Example Applications: examples/PIPS/antiword/src/worddos.c Source File</title> |
|
6 <link href="tabs.css" rel="stylesheet" type="text/css"/> |
|
7 <link href="doxygen.css" rel="stylesheet" type="text/css"/> |
|
8 </head> |
|
9 <body> |
|
10 <!-- Generated by Doxygen 1.6.2 --> |
|
11 <h1>examples/PIPS/antiword/src/worddos.c</h1><div class="fragment"><pre class="fragment"><a name="l00001"></a>00001 <span class="comment">/*</span> |
|
12 <a name="l00002"></a>00002 <span class="comment"> * worddos.c</span> |
|
13 <a name="l00003"></a>00003 <span class="comment"> * Copyright (C) 2002-2005 A.J. van Os; Released under GNU GPL</span> |
|
14 <a name="l00004"></a>00004 <span class="comment"> *</span> |
|
15 <a name="l00005"></a>00005 <span class="comment"> * Description:</span> |
|
16 <a name="l00006"></a>00006 <span class="comment"> * Deal with the DOS internals of a MS Word file</span> |
|
17 <a name="l00007"></a>00007 <span class="comment"> */</span> |
|
18 <a name="l00008"></a>00008 |
|
19 <a name="l00009"></a>00009 <span class="preprocessor">#include "antiword.h"</span> |
|
20 <a name="l00010"></a>00010 |
|
21 <a name="l00011"></a>00011 |
|
22 <a name="l00012"></a>00012 <span class="comment">/*</span> |
|
23 <a name="l00013"></a>00013 <span class="comment"> * bGetDocumentText - make a list of the text blocks of a Word document</span> |
|
24 <a name="l00014"></a>00014 <span class="comment"> *</span> |
|
25 <a name="l00015"></a>00015 <span class="comment"> * Return TRUE when successful, otherwise FALSE</span> |
|
26 <a name="l00016"></a>00016 <span class="comment"> */</span> |
|
27 <a name="l00017"></a>00017 <span class="keyword">static</span> BOOL |
|
28 <a name="l00018"></a>00018 bGetDocumentText(FILE *pFile, <span class="keywordtype">long</span> lFilesize, <span class="keyword">const</span> UCHAR *aucHeader) |
|
29 <a name="l00019"></a>00019 { |
|
30 <a name="l00020"></a>00020 text_block_type tTextBlock; |
|
31 <a name="l00021"></a>00021 ULONG ulTextLen; |
|
32 <a name="l00022"></a>00022 BOOL bFastSaved; |
|
33 <a name="l00023"></a>00023 UCHAR ucDocStatus, ucVersion; |
|
34 <a name="l00024"></a>00024 |
|
35 <a name="l00025"></a>00025 fail(pFile == NULL); |
|
36 <a name="l00026"></a>00026 fail(lFilesize &lt; 128); |
|
37 <a name="l00027"></a>00027 fail(aucHeader == NULL); |
|
38 <a name="l00028"></a>00028 |
|
39 <a name="l00029"></a>00029 <span class="comment">/* Get the status flags from the header */</span> |
|
40 <a name="l00030"></a>00030 ucDocStatus = ucGetByte(0x75, aucHeader); |
|
41 <a name="l00031"></a>00031 DBG_HEX(ucDocStatus); |
|
42 <a name="l00032"></a>00032 bFastSaved = (ucDocStatus &amp; BIT(1)) != 0; |
|
43 <a name="l00033"></a>00033 DBG_MSG_C(bFastSaved, <span class="stringliteral">"This document is Fast Saved"</span>); |
|
44 <a name="l00034"></a>00034 ucVersion = ucGetByte(0x74, aucHeader); |
|
45 <a name="l00035"></a>00035 DBG_DEC(ucVersion); |
|
46 <a name="l00036"></a>00036 DBG_MSG_C(ucVersion == 0, <span class="stringliteral">"Written by Word 4.0 or earlier"</span>); |
|
47 <a name="l00037"></a>00037 DBG_MSG_C(ucVersion == 3, <span class="stringliteral">"Word 5.0 format, but not written by Word"</span>); |
|
48 <a name="l00038"></a>00038 DBG_MSG_C(ucVersion == 4, <span class="stringliteral">"Written by Word 5.x"</span>); |
|
49 <a name="l00039"></a>00039 <span class="keywordflow">if</span> (bFastSaved) { |
|
50 <a name="l00040"></a>00040 werr(0, <span class="stringliteral">"Word for DOS: autosave documents are not supported"</span>); |
|
51 <a name="l00041"></a>00041 <span class="keywordflow">return</span> FALSE; |
|
52 <a name="l00042"></a>00042 } |
|
53 <a name="l00043"></a>00043 |
|
54 <a name="l00044"></a>00044 <span class="comment">/* Get length information */</span> |
|
55 <a name="l00045"></a>00045 ulTextLen = ulGetLong(0x0e, aucHeader); |
|
56 <a name="l00046"></a>00046 DBG_HEX(ulTextLen); |
|
57 <a name="l00047"></a>00047 ulTextLen -= 128; |
|
58 <a name="l00048"></a>00048 DBG_DEC(ulTextLen); |
|
59 <a name="l00049"></a>00049 tTextBlock.ulFileOffset = 128; |
|
60 <a name="l00050"></a>00050 tTextBlock.ulCharPos = 128; |
|
61 <a name="l00051"></a>00051 tTextBlock.ulLength = ulTextLen; |
|
62 <a name="l00052"></a>00052 tTextBlock.bUsesUnicode = FALSE; |
|
63 <a name="l00053"></a>00053 tTextBlock.usPropMod = IGNORE_PROPMOD; |
|
64 <a name="l00054"></a>00054 <span class="keywordflow">if</span> (!bAdd2TextBlockList(&amp;tTextBlock)) { |
|
65 <a name="l00055"></a>00055 DBG_HEX(tTextBlock.ulFileOffset); |
|
66 <a name="l00056"></a>00056 DBG_HEX(tTextBlock.ulCharPos); |
|
67 <a name="l00057"></a>00057 DBG_DEC(tTextBlock.ulLength); |
|
68 <a name="l00058"></a>00058 DBG_DEC(tTextBlock.bUsesUnicode); |
|
69 <a name="l00059"></a>00059 DBG_DEC(tTextBlock.usPropMod); |
|
70 <a name="l00060"></a>00060 <span class="keywordflow">return</span> FALSE; |
|
71 <a name="l00061"></a>00061 } |
|
72 <a name="l00062"></a>00062 <span class="keywordflow">return</span> TRUE; |
|
73 <a name="l00063"></a>00063 } <span class="comment">/* end of bGetDocumentText */</span> |
|
74 <a name="l00064"></a>00064 |
|
75 <a name="l00065"></a>00065 <span class="comment">/*</span> |
|
76 <a name="l00066"></a>00066 <span class="comment"> * iInitDocumentDOS - initialize a DOS document</span> |
|
77 <a name="l00067"></a>00067 <span class="comment"> *</span> |
|
78 <a name="l00068"></a>00068 <span class="comment"> * Returns the version of Word that made the document or -1</span> |
|
79 <a name="l00069"></a>00069 <span class="comment"> */</span> |
|
80 <a name="l00070"></a>00070 <span class="keywordtype">int</span> |
|
81 <a name="l00071"></a>00071 iInitDocumentDOS(FILE *pFile, <span class="keywordtype">long</span> lFilesize) |
|
82 <a name="l00072"></a>00072 { |
|
83 <a name="l00073"></a>00073 <span class="keywordtype">int</span> iWordVersion; |
|
84 <a name="l00074"></a>00074 BOOL bSuccess; |
|
85 <a name="l00075"></a>00075 USHORT usIdent; |
|
86 <a name="l00076"></a>00076 UCHAR aucHeader[128]; |
|
87 <a name="l00077"></a>00077 |
|
88 <a name="l00078"></a>00078 fail(pFile == NULL); |
|
89 <a name="l00079"></a>00079 |
|
90 <a name="l00080"></a>00080 <span class="keywordflow">if</span> (lFilesize &lt; 128) { |
|
91 <a name="l00081"></a>00081 <span class="keywordflow">return</span> -1; |
|
92 <a name="l00082"></a>00082 } |
|
93 <a name="l00083"></a>00083 |
|
94 <a name="l00084"></a>00084 <span class="comment">/* Read the headerblock */</span> |
|
95 <a name="l00085"></a>00085 <span class="keywordflow">if</span> (!bReadBytes(aucHeader, 128, 0x00, pFile)) { |
|
96 <a name="l00086"></a>00086 <span class="keywordflow">return</span> -1; |
|
97 <a name="l00087"></a>00087 } |
|
98 <a name="l00088"></a>00088 <span class="comment">/* Get the "magic number" from the header */</span> |
|
99 <a name="l00089"></a>00089 usIdent = usGetWord(0x00, aucHeader); |
|
100 <a name="l00090"></a>00090 DBG_HEX(usIdent); |
|
101 <a name="l00091"></a>00091 fail(usIdent != 0xbe31); <span class="comment">/* Word for DOS */</span> |
|
102 <a name="l00092"></a>00092 iWordVersion = iGetVersionNumber(aucHeader); |
|
103 <a name="l00093"></a>00093 <span class="keywordflow">if</span> (iWordVersion != 0) { |
|
104 <a name="l00094"></a>00094 werr(0, <span class="stringliteral">"This file is not from 'Word for DOS'."</span>); |
|
105 <a name="l00095"></a>00095 <span class="keywordflow">return</span> -1; |
|
106 <a name="l00096"></a>00096 } |
|
107 <a name="l00097"></a>00097 bSuccess = bGetDocumentText(pFile, lFilesize, aucHeader); |
|
108 <a name="l00098"></a>00098 <span class="keywordflow">if</span> (bSuccess) { |
|
109 <a name="l00099"></a>00099 vGetPropertyInfo(pFile, NULL, |
|
110 <a name="l00100"></a>00100 NULL, 0, NULL, 0, |
|
111 <a name="l00101"></a>00101 aucHeader, iWordVersion); |
|
112 <a name="l00102"></a>00102 vSetDefaultTabWidth(pFile, NULL, |
|
113 <a name="l00103"></a>00103 NULL, 0, NULL, 0, |
|
114 <a name="l00104"></a>00104 aucHeader, iWordVersion); |
|
115 <a name="l00105"></a>00105 vGetNotesInfo(pFile, NULL, |
|
116 <a name="l00106"></a>00106 NULL, 0, NULL, 0, |
|
117 <a name="l00107"></a>00107 aucHeader, iWordVersion); |
|
118 <a name="l00108"></a>00108 } |
|
119 <a name="l00109"></a>00109 <span class="keywordflow">return</span> bSuccess ? iWordVersion : -1; |
|
120 <a name="l00110"></a>00110 } <span class="comment">/* end of iInitDocumentDOS */</span> |
|
121 </pre></div> |
|
122 <hr size="1"/><address style="text-align: right;"><small>Generated by |
|
123 <a href="http://www.doxygen.org/index.html"> |
|
124 <img class="footer" src="doxygen.png" alt="doxygen"/></a> 1.6.2 </small></address> |
|
125 </body> |
|
126 </html> |
|