Subversion Repositories planix.SVN

Rev

Rev 2 | Blame | Compare with Previous | Last modification | View Log | RSS feed

/*
 * worddos.c
 * Copyright (C) 2002-2005 A.J. van Os; Released under GNU GPL
 *
 * Description:
 * Deal with the DOS internals of a MS Word file
 */

#include "antiword.h"


/*
 * bGetDocumentText - make a list of the text blocks of a Word document
 *
 * Return TRUE when succesful, otherwise FALSE
 */
static BOOL
bGetDocumentText(FILE *pFile, long lFilesize, const UCHAR *aucHeader)
{
        text_block_type tTextBlock;
        ULONG   ulTextLen;
        BOOL    bFastSaved;
        UCHAR   ucDocStatus, ucVersion;

        fail(pFile == NULL);
        fail(lFilesize < 128);
        fail(aucHeader == NULL);

        /* Get the status flags from the header */
        ucDocStatus = ucGetByte(0x75, aucHeader);
        DBG_HEX(ucDocStatus);
        bFastSaved = (ucDocStatus & BIT(1)) != 0;
        DBG_MSG_C(bFastSaved, "This document is Fast Saved");
        ucVersion = ucGetByte(0x74, aucHeader);
        DBG_DEC(ucVersion);
        DBG_MSG_C(ucVersion == 0, "Written by Word 4.0 or earlier");
        DBG_MSG_C(ucVersion == 3, "Word 5.0 format, but not written by Word");
        DBG_MSG_C(ucVersion == 4, "Written by Word 5.x");
        if (bFastSaved) {
                werr(0, "Word for DOS: autosave documents are not supported");
                return FALSE;
        }

        /* Get length information */
        ulTextLen = ulGetLong(0x0e, aucHeader);
        DBG_HEX(ulTextLen);
        ulTextLen -= 128;
        DBG_DEC(ulTextLen);
        tTextBlock.ulFileOffset = 128;
        tTextBlock.ulCharPos = 128;
        tTextBlock.ulLength = ulTextLen;
        tTextBlock.bUsesUnicode = FALSE;
        tTextBlock.usPropMod = IGNORE_PROPMOD;
        if (!bAdd2TextBlockList(&tTextBlock)) {
                DBG_HEX(tTextBlock.ulFileOffset);
                DBG_HEX(tTextBlock.ulCharPos);
                DBG_DEC(tTextBlock.ulLength);
                DBG_DEC(tTextBlock.bUsesUnicode);
                DBG_DEC(tTextBlock.usPropMod);
                return FALSE;
        }
        return TRUE;
} /* end of bGetDocumentText */

/*
 * iInitDocumentDOS - initialize an DOS document
 *
 * Returns the version of Word that made the document or -1
 */
int
iInitDocumentDOS(FILE *pFile, long lFilesize)
{
        int     iWordVersion;
        BOOL    bSuccess;
        USHORT  usIdent;
        UCHAR   aucHeader[128];

        fail(pFile == NULL);

        if (lFilesize < 128) {
                return -1;
        }

        /* Read the headerblock */
        if (!bReadBytes(aucHeader, 128, 0x00, pFile)) {
                return -1;
        }
        /* Get the "magic number" from the header */
        usIdent = usGetWord(0x00, aucHeader);
        DBG_HEX(usIdent);
        fail(usIdent != 0xbe31);        /* Word for DOS */
        iWordVersion = iGetVersionNumber(aucHeader);
        if (iWordVersion != 0) {
                werr(0, "This file is not from 'Word for DOS'.");
                return -1;
        }
        bSuccess = bGetDocumentText(pFile, lFilesize, aucHeader);
        if (bSuccess) {
                vGetPropertyInfo(pFile, NULL,
                                NULL, 0, NULL, 0,
                                aucHeader, iWordVersion);
                vSetDefaultTabWidth(pFile, NULL,
                                NULL, 0, NULL, 0,
                                aucHeader, iWordVersion);
                vGetNotesInfo(pFile, NULL,
                                NULL, 0, NULL, 0,
                                aucHeader, iWordVersion);
        }
        return bSuccess ? iWordVersion : -1;
} /* end of iInitDocumentDOS */