diff options
Diffstat (limited to 'sw/source/filter/ww8/ww8scan.hxx')
-rw-r--r-- | sw/source/filter/ww8/ww8scan.hxx | 1784 |
1 files changed, 1784 insertions, 0 deletions
diff --git a/sw/source/filter/ww8/ww8scan.hxx b/sw/source/filter/ww8/ww8scan.hxx new file mode 100644 index 000000000000..33d40bcf4c0d --- /dev/null +++ b/sw/source/filter/ww8/ww8scan.hxx @@ -0,0 +1,1784 @@ +/************************************************************************* + * + * DO NOT ALTER OR REMOVE COPYRIGHT NOTICES OR THIS FILE HEADER. + * + * Copyright 2000, 2010 Oracle and/or its affiliates. + * + * OpenOffice.org - a multi-platform office productivity suite + * + * This file is part of OpenOffice.org. + * + * OpenOffice.org is free software: you can redistribute it and/or modify + * it under the terms of the GNU Lesser General Public License version 3 + * only, as published by the Free Software Foundation. + * + * OpenOffice.org is distributed in the hope that it will be useful, + * but WITHOUT ANY WARRANTY; without even the implied warranty of + * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the + * GNU Lesser General Public License version 3 for more details + * (a copy is included in the LICENSE file that accompanied this code). + * + * You should have received a copy of the GNU Lesser General Public License + * version 3 along with OpenOffice.org. If not, see + * <http://www.openoffice.org/license.html> + * for a copy of the LGPLv3 License. + * + ************************************************************************/ + +/* -*- Mode: C; tab-width: 4; indent-tabs-mode: nil -*- */ + +#ifndef _WW8SCAN_HXX +#define _WW8SCAN_HXX + +#ifndef LONG_MAX +#include <limits.h> +#endif +#include <stack> +#include <vector> +#include <list> +#include <algorithm> +#include <tools/solar.h> // UINTXX +#include <tools/datetime.hxx> +#include <tools/stream.hxx> +#include <tools/string.hxx> +#include <errhdl.hxx> // ASSERT() +#include "hash_wrap.hxx" +#include "sortedarray.hxx" + +#ifndef WW8STRUC_HXX +#include "ww8struc.hxx" // FIB, STSHI, STD... +#endif +#include <types.hxx> + +#include <unomid.h> + +#define APPEND_CONST_ASC(s) AppendAscii(RTL_CONSTASCII_STRINGPARAM(s)) +#define ASSIGN_CONST_ASC(s) AssignAscii(RTL_CONSTASCII_STRINGPARAM(s)) +#define CREATE_CONST_ASC(s) String::CreateFromAscii( \ + RTL_CONSTASCII_STRINGPARAM(s)) + + + +//--Line below which the code has meaningful comments + +//Commonly used string literals for stream and storage names in word docs +namespace SL +{ +# define DEFCONSTSTRINGARRAY(X) extern const char a##X[sizeof("" #X "")] + DEFCONSTSTRINGARRAY(ObjectPool); + DEFCONSTSTRINGARRAY(1Table); + DEFCONSTSTRINGARRAY(0Table); + DEFCONSTSTRINGARRAY(Data); + DEFCONSTSTRINGARRAY(CheckBox); + DEFCONSTSTRINGARRAY(ListBox); + DEFCONSTSTRINGARRAY(TextBox); + DEFCONSTSTRINGARRAY(TextField); + DEFCONSTSTRINGARRAY(MSMacroCmds); +} + +/** + winword strings are typically Belt and Braces strings preceeded with a + pascal style count, and ending with a c style 0 terminator. 16bit chars + and count for ww8+ and 8bit chars and count for ww7-. The count and 0 + can be checked for integrity to catch errors (e.g. lotus created documents) + where in error 8bit strings are used instead of 16bits strings for style + names. +*/ +template<class C> class wwString +{ +public: + static bool TestBeltAndBraces(const SvStream& rStrm); + //move the other string related code into this class as time goes by +}; + +typedef wwString<sal_uInt16> ww8String; + +struct SprmInfo +{ + sal_uInt16 nId; ///< A ww8 sprm is hardcoded as 16bits + unsigned int nLen : 6; + unsigned int nVari : 2; +}; + +struct SprmInfoHash +{ + size_t operator()(const SprmInfo &a) const + { + return a.nId; + } +}; + +typedef ww::WrappedHash<SprmInfo, SprmInfoHash> wwSprmSearcher; +typedef ww::WrappedHash<sal_uInt16> wwSprmSequence; + +/** + wwSprmParser knows how to take a sequence of bytes and split it up into + sprms and their arguments +*/ +class wwSprmParser +{ +private: + ww::WordVersion meVersion; + BYTE mnDelta; + const wwSprmSearcher *mpKnownSprms; + static const wwSprmSearcher* GetWW8SprmSearcher(); + static const wwSprmSearcher* GetWW6SprmSearcher(); + static const wwSprmSearcher* GetWW2SprmSearcher(); + + SprmInfo GetSprmInfo(sal_uInt16 nId) const; + + BYTE SprmDataOfs(sal_uInt16 nId) const; + + enum SprmType {L_FIX=0, L_VAR=1, L_VAR2=2}; +public: + //7- ids are very different to 8+ ones + wwSprmParser(ww::WordVersion eVersion); + /// Return the SPRM id at the beginning of this byte sequence + sal_uInt16 GetSprmId(const sal_uInt8* pSp) const; + + USHORT GetSprmSize(sal_uInt16 nId, const sal_uInt8* pSprm) const; + + /// Get known len of a sprms head, the bytes of the sprm id + any bytes + /// reserved to hold a variable length + USHORT DistanceToData(sal_uInt16 nId) const; + + /// Get len of a sprms data area, ignoring the bytes of the sprm id and + /// ignoring any len bytes. Reports the remaining data after those bytes + USHORT GetSprmTailLen(sal_uInt16 nId, const sal_uInt8 * pSprm) const; + + /// The minimum acceptable sprm len possible for this type of parser + int MinSprmLen() const { return (IsSevenMinus(meVersion)) ? 2 : 3; } + + inline int getVersion() const { return meVersion; } //cmc, I'm dubious about the usage of this, how can it be 0 +}; + +//--Line abovewhich the code has meaningful comments + +class WW8Fib; +class WW8ScannerBase; +class WW8PLCFspecial; +struct WW8PLCFxDesc; +class WW8PLCFx_PCD; + +String WW8ReadPString( SvStream& rStrm, rtl_TextEncoding eEnc, + bool bAtEndSeekRel1 = true); + +/** + The following method reads a 2Byte unicode string. If bAtEndSeekRel1 is set, + exactly ONE byte is skipped If nChars is set then that number of characters + (not bytes) is read, if its not set, the first character read is the length +*/ +String WW8Read_xstz(SvStream& rStrm, USHORT nChars, bool bAtEndSeekRel1); + +/** + reads array of strings (see MS documentation: STring TaBle stored in File) + returns NOT the original pascal strings but an array of converted char* + + attention: the *extra data* of each string are SKIPPED and ignored + */ +void WW8ReadSTTBF(bool bVer8, SvStream& rStrm, UINT32 nStart, INT32 nLen, + USHORT nExtraLen, rtl_TextEncoding eCS, ::std::vector<String> &rArray, + ::std::vector<ww::bytes>* pExtraArray = 0, ::std::vector<String>* pValueArray = 0); + +struct WW8FieldDesc +{ + long nLen; ///< Gesamtlaenge ( zum Text ueberlesen ) + WW8_CP nSCode; ///< Anfang Befehlscode + WW8_CP nLCode; ///< Laenge + WW8_CP nSRes; ///< Anfang Ergebnis + WW8_CP nLRes; ///< Laenge ( == 0, falls kein Ergebnis ) + USHORT nId; ///< WW-Id fuer Felder + BYTE nOpt; ///< WW-Flags ( z.B.: vom User geaendert ) + BYTE bCodeNest:1; ///< Befehl rekursiv verwendet + BYTE bResNest:1; ///< Befehl in Resultat eingefuegt +}; + +struct WW8PLCFxSave1 +{ + ULONG nPLCFxPos; + ULONG nPLCFxPos2; ///< fuer PLCF_Cp_Fkp: PieceIter-Pos + long nPLCFxMemOfs; + WW8_CP nStartCp; ///< for cp based iterator like PAP and CHP + long nCpOfs; + WW8_FC nStartFC; + WW8_CP nAttrStart; + WW8_CP nAttrEnd; + bool bLineEnd; +}; + +/** + u.a. fuer Felder, also genausoviele Attr wie Positionen, + falls Ctor-Param bNoEnd = false +*/ +class WW8PLCFspecial // Iterator fuer PLCFs +{ +private: + INT32* pPLCF_PosArray; ///< Pointer auf Pos-Array und auf ganze Struktur + BYTE* pPLCF_Contents; ///< Pointer auf Inhalts-Array-Teil des Pos-Array + long nIMax; ///< Anzahl der Elemente + long nIdx; ///< Merker, wo wir gerade sind + long nStru; +public: + WW8PLCFspecial( SvStream* pSt, long nFilePos, long nPLCF, + long nStruct, long nStartPos = -1 ); + ~WW8PLCFspecial() { delete[] pPLCF_PosArray; } + long GetIdx() const { return nIdx; } + void SetIdx( long nI ) { nIdx = nI; } + long GetIMax() const { return nIMax; } + bool SeekPos(long nPos); // geht ueber FC- bzw. CP-Wert + // bzw. naechste groesseren Wert + bool SeekPosExact(long nPos); + INT32 Where() const + { return ( nIdx >= nIMax ) ? SAL_MAX_INT32 : pPLCF_PosArray[nIdx]; } + bool Get(WW8_CP& rStart, void*& rpValue) const; + bool GetData(long nIdx, WW8_CP& rPos, void*& rpValue) const; + + const void* GetData( long nInIdx ) const + { + return ( nInIdx >= nIMax ) ? 0 + : (const void*)&pPLCF_Contents[nInIdx * nStru]; + } + INT32 GetPos( long nInIdx ) const + { return ( nInIdx >= nIMax ) ? SAL_MAX_INT32 : pPLCF_PosArray[nInIdx]; } + + WW8PLCFspecial& operator ++( int ) { nIdx++; return *this; } + WW8PLCFspecial& operator --( int ) { nIdx--; return *this; } +}; + +/** simple Iterator for SPRMs */ +class WW8SprmIter +{ +private: + const wwSprmParser &mrSprmParser; + // these members will be updated + const BYTE* pSprms; // remaining part of the SPRMs ( == start of akt. SPRM) + const BYTE* pAktParams; // start of akt. SPRM's parameters + USHORT nAktId; + USHORT nAktSize; + + long nRemLen; // length of remaining SPRMs (including akt. SPRM) + + void UpdateMyMembers(); +public: + explicit WW8SprmIter( const BYTE* pSprms_, long nLen_, + const wwSprmParser &rSprmParser); + void SetSprms( const BYTE* pSprms_, long nLen_ ); + const BYTE* FindSprm(USHORT nId); + const BYTE* operator ++( int ); + const BYTE* GetSprms() const + { return ( pSprms && (0 < nRemLen) ) ? pSprms : 0; } + const BYTE* GetAktParams() const { return pAktParams; } + USHORT GetAktId() const { return nAktId; } +private: + //No copying + WW8SprmIter(const WW8SprmIter&); + WW8SprmIter& operator=(const WW8SprmIter&); +}; + +/* u.a. fuer FKPs auf normale Attr., also ein Attr weniger als Positionen */ +class WW8PLCF // Iterator fuer PLCFs +{ +private: + WW8_CP* pPLCF_PosArray; // Pointer auf Pos-Array und auf ganze Struktur + BYTE* pPLCF_Contents; // Pointer auf Inhalts-Array-Teil des Pos-Array + INT32 nIMax; // Anzahl der Elemente + INT32 nIdx; + int nStru; + + void ReadPLCF( SvStream* pSt, WW8_FC nFilePos, INT32 nPLCF ); + + /* + Falls im Dok ein PLC fehlt und die FKPs solo dastehen, + machen wir uns hiermit einen PLC: + */ + void GeneratePLCF( SvStream* pSt, INT32 nPN, INT32 ncpN ); + + void MakeFailedPLCF(); +public: + WW8PLCF( SvStream* pSt, WW8_FC nFilePos, INT32 nPLCF, int nStruct, + WW8_CP nStartPos = -1 ); + + /* + folgender Ctor generiert ggfs. einen PLC aus nPN und ncpN + */ + WW8PLCF( SvStream* pSt, WW8_FC nFilePos, INT32 nPLCF, int nStruct, + WW8_CP nStartPos, INT32 nPN, INT32 ncpN ); + + ~WW8PLCF(){ delete[] pPLCF_PosArray; } + INT32 GetIdx() const { return nIdx; } + void SetIdx( INT32 nI ) { nIdx = nI; } + INT32 GetIMax() const { return nIMax; } + bool SeekPos(WW8_CP nPos); + WW8_CP Where() const; + bool Get(WW8_CP& rStart, WW8_CP& rEnd, void*& rpValue) const; + WW8PLCF& operator ++( int ) { if( nIdx < nIMax ) nIdx++; return *this; } + + const void* GetData( INT32 nInIdx ) const + { + return ( nInIdx >= nIMax ) ? 0 : + (const void*)&pPLCF_Contents[nInIdx * nStru]; + } +}; + +/* for Piece Table (.i.e. FastSave Table) */ +class WW8PLCFpcd +{ +friend class WW8PLCFpcd_Iter; + INT32* pPLCF_PosArray; // Pointer auf Pos-Array und auf ganze Struktur + BYTE* pPLCF_Contents; // Pointer auf Inhalts-Array-Teil des Pos-Array + long nIMax; + long nStru; +public: + WW8PLCFpcd( SvStream* pSt, long nFilePos, long nPLCF, long nStruct ); + ~WW8PLCFpcd(){ delete[] pPLCF_PosArray; } +}; + +/* mehrere WW8PLCFpcd_Iter koennen auf die gleiche WW8PLCFpcd zeigen !!! */ +class WW8PLCFpcd_Iter +{ +private: + WW8PLCFpcd& rPLCF; + long nIdx; + + //No copying + WW8PLCFpcd_Iter(const WW8PLCFpcd_Iter&); + WW8PLCFpcd_Iter& operator=(const WW8PLCFpcd_Iter&); +public: + WW8PLCFpcd_Iter( WW8PLCFpcd& rPLCFpcd, long nStartPos = -1 ); + long GetIdx() const { return nIdx; } + void SetIdx( long nI ) { nIdx = nI; } + long GetIMax() const { return rPLCF.nIMax; } + bool SeekPos(long nPos); + INT32 Where() const; + bool Get(WW8_CP& rStart, WW8_CP& rEnd, void*& rpValue) const; + WW8PLCFpcd_Iter& operator ++( int ) + { + if( nIdx < rPLCF.nIMax ) + nIdx++; + return *this; + } +}; + +// PLCF-Typ: +enum ePLCFT{ CHP=0, PAP, SEP, /*HED, FNR, ENR,*/ PLCF_END }; + +//Its hardcoded that eFTN be the first one: A very poor hack, needs to be fixed +enum eExtSprm { eFTN = 256, eEDN = 257, eFLD = 258, eBKN = 259, eAND = 260 }; + +/* + pure virtual: +*/ +class WW8PLCFx // virtueller Iterator fuer Piece Table Exceptions +{ +private: + ww::WordVersion meVer; // Version number of FIB + bool bIsSprm; // PLCF von Sprms oder von anderem ( Footnote, ... ) + WW8_FC nStartFc; + bool bDirty; + + //No copying + WW8PLCFx(const WW8PLCFx&); + WW8PLCFx& operator=(const WW8PLCFx&); +public: + WW8PLCFx(ww::WordVersion eVersion, bool bSprm) + : meVer(eVersion), bIsSprm(bSprm), bDirty(false) {} + virtual ~WW8PLCFx() {} + bool IsSprm() const { return bIsSprm; } + virtual ULONG GetIdx() const = 0; + virtual void SetIdx( ULONG nIdx ) = 0; + virtual ULONG GetIdx2() const; + virtual void SetIdx2( ULONG nIdx ); + virtual bool SeekPos(WW8_CP nCpPos) = 0; + virtual WW8_FC Where() = 0; + virtual void GetSprms( WW8PLCFxDesc* p ); + virtual long GetNoSprms( WW8_CP& rStart, WW8_CP&, sal_Int32& rLen ); + virtual WW8PLCFx& operator ++( int ) = 0; + virtual USHORT GetIstd() const { return 0xffff; } + virtual void Save( WW8PLCFxSave1& rSave ) const; + virtual void Restore( const WW8PLCFxSave1& rSave ); + ww::WordVersion GetFIBVersion() const { return meVer; } + void SetStartFc( WW8_FC nFc ) { nStartFc = nFc; } + WW8_FC GetStartFc() const { return nStartFc; } + void SetDirty(bool bIn) {bDirty=bIn;} + bool GetDirty() const {return bDirty;} +}; + +class WW8PLCFx_PCDAttrs : public WW8PLCFx +{ +private: + WW8PLCFpcd_Iter* pPcdI; + WW8PLCFx_PCD* pPcd; + BYTE** const pGrpprls; // Attribute an Piece-Table + SVBT32 aShortSprm; // mini storage: can contain ONE sprm with + // 1 byte param + UINT16 nGrpprls; // Attribut Anzahl davon + + //No copying + WW8PLCFx_PCDAttrs(const WW8PLCFx_PCDAttrs&); + WW8PLCFx_PCDAttrs& operator=(const WW8PLCFx_PCDAttrs&); +public: + WW8PLCFx_PCDAttrs(ww::WordVersion eVersion, WW8PLCFx_PCD* pPLCFx_PCD, + const WW8ScannerBase* pBase ); + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nI ); + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_FC Where(); + virtual void GetSprms( WW8PLCFxDesc* p ); + virtual WW8PLCFx& operator ++( int ); + + WW8PLCFpcd_Iter* GetIter() const { return pPcdI; } +}; + +class WW8PLCFx_PCD : public WW8PLCFx // Iterator fuer Piece Table +{ +private: + WW8PLCFpcd_Iter* pPcdI; + bool bVer67; + WW8_CP nClipStart; + + //No copying + WW8PLCFx_PCD(const WW8PLCFx_PCD&); + WW8PLCFx_PCD& operator=(const WW8PLCFx_PCD&); +public: + WW8PLCFx_PCD(ww::WordVersion eVersion, WW8PLCFpcd* pPLCFpcd, + WW8_CP nStartCp, bool bVer67P); + virtual ~WW8PLCFx_PCD(); + virtual ULONG GetIMax() const; + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nI ); + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_FC Where(); + virtual long GetNoSprms( WW8_CP& rStart, WW8_CP&, sal_Int32& rLen ); + virtual WW8PLCFx& operator ++( int ); + WW8_CP AktPieceStartFc2Cp( WW8_FC nStartPos ); + WW8_FC AktPieceStartCp2Fc( WW8_CP nCp ); + void AktPieceFc2Cp(WW8_CP& rStartPos, WW8_CP& rEndPos, + const WW8ScannerBase *pSBase); + WW8PLCFpcd_Iter* GetPLCFIter() { return pPcdI; } + void SetClipStart(WW8_CP nIn) { nClipStart = nIn; } + WW8_CP GetClipStart() { return nClipStart; } + + static INT32 TransformPieceAddress(long nfc, bool& bIsUnicodeAddress) + { + bIsUnicodeAddress = 0 == (0x40000000 & nfc); + return bIsUnicodeAddress ? nfc : (nfc & 0x3fffFFFF) / 2; + } +}; + +/** + Iterator for Piece Table Exceptions of Fkps + works only with FCs, not with CPs ! ( Low-Level ) +*/ +class WW8PLCFx_Fc_FKP : public WW8PLCFx +{ +public: + class WW8Fkp // Iterator for Formatted Disk Page + { + private: + class Entry + { + public: + WW8_FC mnFC; + + sal_uInt8* mpData; + sal_uInt16 mnLen; + sal_uInt16 mnIStd; // only for Fkp.Papx (actualy Style-Nr) + bool mbMustDelete; + + explicit Entry(WW8_FC nFC) : mnFC(nFC), mpData(0), mnLen(0), + mnIStd(0), mbMustDelete(false) {} + Entry(const Entry &rEntry); + ~Entry(); + bool operator<(const Entry& rEntry) const; + Entry& operator=(const Entry& rEntry); + }; + + sal_uInt8 maRawData[512]; + std::vector<Entry> maEntries; + + long nItemSize; // entweder 1 Byte oder ein komplettes BX + + // Offset in Stream where last read of 52 bytes took place + long nFilePos; + sal_uInt8 mnIdx; // Pos-Merker + ePLCFT ePLCF; + sal_uInt8 mnIMax; // Anzahl der Eintraege + + wwSprmParser maSprmParser; + public: + WW8Fkp (ww::WordVersion eVersion, SvStream* pFKPStrm, + SvStream* pDataStrm, long _nFilePos, long nItemSiz, ePLCFT ePl, + WW8_FC nStartFc = -1); + void Reset(WW8_FC nPos); + long GetFilePos() const { return nFilePos; } + sal_uInt8 GetIdx() const { return mnIdx; } + bool SetIdx(sal_uInt8 nI); + bool SeekPos(WW8_FC nFc); + WW8_FC Where() const + { + return (mnIdx < mnIMax) ? maEntries[mnIdx].mnFC : WW8_FC_MAX; + } + WW8Fkp& operator ++( int ) + { + if (mnIdx < mnIMax) + mnIdx++; + return *this; + } + BYTE* Get( WW8_FC& rStart, WW8_FC& rEnd, sal_Int32& rLen ) const; + sal_uInt16 GetIstd() const { return maEntries[mnIdx].mnIStd; } + + /* + liefert einen echten Pointer auf das Sprm vom Typ nId, + falls ein solches im Fkp drin ist. + */ + BYTE* GetLenAndIStdAndSprms(sal_Int32& rLen) const; + + /* + ruft GetLenAndIStdAndSprms() auf... + */ + const BYTE* HasSprm( USHORT nId ); + bool HasSprm(USHORT nId, std::vector<const BYTE *> &rResult); + + const wwSprmParser &GetSprmParser() const { return maSprmParser; } + }; +private: + SvStream* pFKPStrm; // Input-File + SvStream* pDataStrm; // Input-File + WW8PLCF* pPLCF; + WW8Fkp* pFkp; + + /* + #100042# + Keep a cache of eMaxCache entries of previously seen pFkps, which + speeds up considerably table parsing and load save plcfs for what turn + out to be small text frames, which frames generally are + + size : cache hits + cache all : 19168 pap, 48 chp + == 100 : 19166 pap, 48 chp + == 50 : 18918 pap, 48 chp + == 10 : 18549 pap, 47 chp + == 5 : 18515 pap, 47 chp + */ + typedef std::list<WW8Fkp*>::iterator myiter; + std::list<WW8Fkp*> maFkpCache; + enum Limits {eMaxCache = 5}; + + bool NewFkp(); + + //No copying + WW8PLCFx_Fc_FKP(const WW8PLCFx_Fc_FKP&); + WW8PLCFx_Fc_FKP& operator=(const WW8PLCFx_Fc_FKP&); +protected: + ePLCFT ePLCF; + WW8PLCFx_PCDAttrs* pPCDAttrs; +public: + WW8PLCFx_Fc_FKP( SvStream* pSt, SvStream* pTblSt, SvStream* pDataSt, + const WW8Fib& rFib, ePLCFT ePl, WW8_FC nStartFcL ); + virtual ~WW8PLCFx_Fc_FKP(); + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nIdx ); + virtual bool SeekPos(WW8_FC nFcPos); + virtual WW8_FC Where(); + BYTE* GetSprmsAndPos( WW8_FC& rStart, WW8_FC& rEnd, sal_Int32& rLen ); + virtual WW8PLCFx& operator ++( int ); + virtual USHORT GetIstd() const; + void GetPCDSprms( WW8PLCFxDesc& rDesc ); + const BYTE* HasSprm( USHORT nId ); + bool HasSprm(USHORT nId, std::vector<const BYTE *> &rResult); + bool HasFkp() const { return (0 != pFkp); } +}; + +/// Iterator fuer Piece Table Exceptions of Fkps arbeitet auf CPs (High-Level) +class WW8PLCFx_Cp_FKP : public WW8PLCFx_Fc_FKP +{ +private: + const WW8ScannerBase& rSBase; + WW8PLCFx_PCD* pPcd; + WW8PLCFpcd_Iter *pPieceIter; + WW8_CP nAttrStart, nAttrEnd; + BYTE bLineEnd : 1; + BYTE bComplex : 1; + + //No copying + WW8PLCFx_Cp_FKP(const WW8PLCFx_Cp_FKP&); + WW8PLCFx_Cp_FKP& operator=(const WW8PLCFx_Cp_FKP&); +public: + WW8PLCFx_Cp_FKP( SvStream* pSt, SvStream* pTblSt, SvStream* pDataSt, + const WW8ScannerBase& rBase, ePLCFT ePl ); + virtual ~WW8PLCFx_Cp_FKP(); + void ResetAttrStartEnd(); + ULONG GetPCDIMax() const; + ULONG GetPCDIdx() const; + void SetPCDIdx( ULONG nIdx ); + virtual ULONG GetIdx2() const; + virtual void SetIdx2( ULONG nIdx ); + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_CP Where(); + virtual void GetSprms( WW8PLCFxDesc* p ); + virtual WW8PLCFx& operator ++( int ); + virtual void Save( WW8PLCFxSave1& rSave ) const; + virtual void Restore( const WW8PLCFxSave1& rSave ); +}; + +/// Iterator for Piece Table Exceptions of Sepx +class WW8PLCFx_SEPX : public WW8PLCFx +{ +private: + wwSprmParser maSprmParser; + SvStream* pStrm; + WW8PLCF* pPLCF; + BYTE* pSprms; + USHORT nArrMax; + UINT16 nSprmSiz; + + //no copying + WW8PLCFx_SEPX(const WW8PLCFx_SEPX&); + WW8PLCFx_SEPX& operator=(const WW8PLCFx_SEPX&); +public: + WW8PLCFx_SEPX( SvStream* pSt, SvStream* pTblxySt, const WW8Fib& rFib, + WW8_CP nStartCp ); + virtual ~WW8PLCFx_SEPX(); + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nIdx ); + long GetIMax() const { return ( pPLCF ) ? pPLCF->GetIMax() : 0; } + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_FC Where(); + virtual void GetSprms( WW8PLCFxDesc* p ); + virtual WW8PLCFx& operator ++( int ); + const BYTE* HasSprm( USHORT nId ) const; + const BYTE* HasSprm( USHORT nId, BYTE n2nd ) const; + const BYTE* HasSprm( USHORT nId, const BYTE* pOtherSprms, + long nOtherSprmSiz ) const; + bool Find4Sprms(USHORT nId1, USHORT nId2, USHORT nId3, USHORT nId4, + BYTE*& p1, BYTE*& p2, BYTE*& p3, BYTE*& p4 ) const; +}; + +/// Iterator fuer Fuss-/Endnoten und Anmerkungen +class WW8PLCFx_SubDoc : public WW8PLCFx +{ +private: + WW8PLCF* pRef; + WW8PLCF* pTxt; + + //No copying + WW8PLCFx_SubDoc(const WW8PLCFx_SubDoc&); + WW8PLCFx_SubDoc& operator=(const WW8PLCFx_SubDoc&); +public: + WW8PLCFx_SubDoc(SvStream* pSt, ww::WordVersion eVersion, WW8_CP nStartCp, + long nFcRef, long nLenRef, long nFcTxt, long nLenTxt, long nStruc = 0); + virtual ~WW8PLCFx_SubDoc(); + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nIdx ); + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_FC Where(); + + // liefert Reference Descriptoren + const void* GetData( long nIdx = -1 ) const + { + return pRef ? pRef->GetData( -1L == nIdx ? pRef->GetIdx() : nIdx ) : 0; + } + + //liefert Angabe, wo Kopf und Fusszeilen-Text zu finden ist + bool Get(long& rStart, void*& rpValue) const; + virtual void GetSprms(WW8PLCFxDesc* p); + virtual WW8PLCFx& operator ++( int ); + long Count() const { return ( pRef ) ? pRef->GetIMax() : 0; } +}; + +/// Iterator for footnotes and endnotes +class WW8PLCFx_FLD : public WW8PLCFx +{ +private: + WW8PLCFspecial* pPLCF; + const WW8Fib& rFib; + //No copying + WW8PLCFx_FLD(const WW8PLCFx_FLD&); + WW8PLCFx_FLD& operator=(const WW8PLCFx_FLD &); +public: + WW8PLCFx_FLD(SvStream* pSt, const WW8Fib& rMyFib, short nType); + virtual ~WW8PLCFx_FLD(); + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nIdx ); + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_FC Where(); + virtual void GetSprms(WW8PLCFxDesc* p); + virtual WW8PLCFx& operator ++( int ); + bool StartPosIsFieldStart(); + bool EndPosIsFieldEnd(); + bool GetPara(long nIdx, WW8FieldDesc& rF); +}; + +enum eBookStatus { BOOK_NORMAL = 0, BOOK_IGNORE = 0x1, BOOK_FIELD = 0x2 }; + +/// Iterator for Booknotes +class WW8PLCFx_Book : public WW8PLCFx +{ +private: + WW8PLCFspecial* pBook[2]; // Start and End Position + ::std::vector<String> aBookNames; // Name + eBookStatus* pStatus; + long nIMax; // Number of Booknotes + USHORT nIsEnd; + int nBookmarkId; // counter incremented by GetUniqueBookmarkName. + + //No copying + WW8PLCFx_Book(const WW8PLCFx_Book&); + WW8PLCFx_Book& operator=(const WW8PLCFx_Book&); +public: + WW8PLCFx_Book(SvStream* pTblSt,const WW8Fib& rFib); + virtual ~WW8PLCFx_Book(); + long GetIMax() const { return nIMax; } + virtual ULONG GetIdx() const; + virtual void SetIdx( ULONG nI ); + virtual ULONG GetIdx2() const; + virtual void SetIdx2( ULONG nIdx ); + virtual bool SeekPos(WW8_CP nCpPos); + virtual WW8_FC Where(); + virtual long GetNoSprms( WW8_CP& rStart, WW8_CP& rEnd, sal_Int32& rLen ); + virtual WW8PLCFx& operator ++( int ); + const String* GetName() const; + WW8_CP GetStartPos() const + { return ( nIsEnd ) ? WW8_CP_MAX : pBook[0]->Where(); } + long GetLen() const; + bool GetIsEnd() const { return nIsEnd ? true : false; } + long GetHandle() const; + void SetStatus( USHORT nIndex, eBookStatus eStat ); + bool MapName(String& rName); + String GetBookmark(long nStart,long nEnd, USHORT &nIndex); + eBookStatus GetStatus() const; + String GetUniqueBookmarkName(String &suggestedName); +}; + +/* + hiermit arbeiten wir draussen: +*/ +struct WW8PLCFManResult +{ + WW8_CP nCpPos; // Attribut-Anfangsposition + long nMemLen; // Laenge dazu + long nCp2OrIdx; // footnote-textpos oder Index in PLCF + WW8_CP nAktCp; // wird nur vom Aufrufer benutzt + const BYTE* pMemPos;// Mem-Pos fuer Sprms + USHORT nSprmId; // Sprm-Id ( 0 = ungueltige Id -> ueberspringen! ) + // (2..255) oder Pseudo-Sprm-Id (256..260) + // bzw. ab Winword-Ver8 die Sprm-Id (800..) + BYTE nFlags; // Absatz- oder Section-Anfang +}; + +enum ManMaskTypes +{ + MAN_MASK_NEW_PAP = 1, // neue Zeile + MAN_MASK_NEW_SEP = 2 // neue Section +}; + +enum ManTypes // enums for PLCFMan-ctor +{ + MAN_MAINTEXT = 0, MAN_FTN = 1, MAN_EDN = 2, MAN_HDFT = 3, MAN_AND = 4, + MAN_TXBX = 5, MAN_TXBX_HDFT = 6 +}; + +/* + hiermit arbeitet der Manager drinnen: +*/ +struct WW8PLCFxDesc +{ + WW8PLCFx* pPLCFx; + ::std::stack<USHORT>* pIdStk; // Speicher fuer Attr-Id fuer Attr-Ende(n) + const BYTE* pMemPos;// wo liegen die Sprm(s) + long nOrigSprmsLen; + + WW8_CP nStartPos; + WW8_CP nEndPos; + + WW8_CP nOrigStartPos; + WW8_CP nOrigEndPos; // The ending character position of a paragraph is + // always one before the end reported in the FKP, + // also a character run that ends on the same location + // as the paragraph mark is adjusted to end just before + // the paragraph mark so as to handle their close + // first. The value being used to determing where the + // properties end is in nEndPos, but the original + // unadjusted end character position is important as + // it can be used as the beginning cp of the next set + // of properties + + WW8_CP nCp2OrIdx; // wo liegen die NoSprm(s) + sal_Int32 nSprmsLen; // wie viele Bytes fuer weitere Sprms / Laenge Fussnote + long nCpOfs; // fuer Offset Header .. Footnote + bool bFirstSprm; // fuer Erkennung erster Sprm einer Gruppe + bool bRealLineEnd; // false bei Pap-Piece-Ende + void Save( WW8PLCFxSave1& rSave ) const; + void Restore( const WW8PLCFxSave1& rSave ); + //With nStartPos set to WW8_CP_MAX then in the case of a pap or chp + //GetSprms will not search for the sprms, but instead take the + //existing ones. + WW8PLCFxDesc() : pIdStk(0), nStartPos(WW8_CP_MAX) {} + void ReduceByOffset(); +}; + +#ifndef DUMP + +struct WW8PLCFxSaveAll; +class WW8PLCFMan +{ +public: + enum WW8PLCFManLimits {MAN_ANZ_PLCF = 10}; +private: + wwSprmParser maSprmParser; + long nCpO; // Origin Cp -- the basis for nNewCp + + WW8_CP nLineEnd; // zeigt *hinter* das <CR> + long nLastWhereIdxCp; // last result of WhereIdx() + USHORT nPLCF; // so viele PLCFe werden verwaltet + ManTypes nManType; + bool mbDoingDrawTextBox; //Normally we adjust the end of attributes + //so that the end of a paragraph occurs + //before the para end mark, but for + //drawboxes we want the true offsets + + WW8PLCFxDesc aD[MAN_ANZ_PLCF]; + WW8PLCFxDesc *pChp, *pPap, *pSep, *pFld, *pFtn, *pEdn, *pBkm, *pPcd, + *pPcdA, *pAnd; + WW8PLCFspecial *pFdoa, *pTxbx, *pTxbxBkd,*pMagicTables, *pSubdocs; + BYTE* pExtendedAtrds; + + const WW8Fib* pWwFib; + + USHORT WhereIdx(bool* pbStart=0, long* pPos=0) const; + void AdjustEnds(WW8PLCFxDesc& rDesc); + void GetNewSprms(WW8PLCFxDesc& rDesc); + void GetNewNoSprms(WW8PLCFxDesc& rDesc); + void GetSprmStart(short nIdx, WW8PLCFManResult* pRes) const; + void GetSprmEnd(short nIdx, WW8PLCFManResult* pRes) const; + void GetNoSprmStart(short nIdx, WW8PLCFManResult* pRes) const; + void GetNoSprmEnd(short nIdx, WW8PLCFManResult* pRes) const; + void AdvSprm(short nIdx, bool bStart); + void AdvNoSprm(short nIdx, bool bStart); + USHORT GetId(const WW8PLCFxDesc* p ) const; +public: + WW8PLCFMan(WW8ScannerBase* pBase, ManTypes nType, long nStartCp, + bool bDoingDrawTextBox = false); + ~WW8PLCFMan(); + + /* + Where fragt, an welcher naechsten Position sich irgendein + Attr aendert... + */ + WW8_CP Where() const; + + bool Get(WW8PLCFManResult* pResult) const; + WW8PLCFMan& operator ++( int ); + USHORT GetColl() const; // index of actual Style + WW8PLCFx_FLD* GetFld() const; + WW8PLCFx_SubDoc* GetEdn() const { return (WW8PLCFx_SubDoc*)pEdn->pPLCFx; } + WW8PLCFx_SubDoc* GetFtn() const { return (WW8PLCFx_SubDoc*)pFtn->pPLCFx; } + WW8PLCFx_SubDoc* GetAtn() const { return (WW8PLCFx_SubDoc*)pAnd->pPLCFx; } + WW8PLCFx_Book* GetBook() const { return (WW8PLCFx_Book*)pBkm->pPLCFx; } + long GetCpOfs() const { return pChp->nCpOfs; } // for Header/Footer... + + /* fragt, ob *aktueller Absatz* einen Sprm diesen Typs hat */ + const BYTE* HasParaSprm( USHORT nId ) const; + + /* fragt, ob *aktueller Textrun* einen Sprm diesen Typs hat */ + const BYTE* HasCharSprm( USHORT nId ) const; + bool HasCharSprm(USHORT nId, std::vector<const BYTE *> &rResult) const; + + WW8PLCFx_Cp_FKP* GetChpPLCF() const + { return (WW8PLCFx_Cp_FKP*)pChp->pPLCFx; } + WW8PLCFx_Cp_FKP* GetPapPLCF() const + { return (WW8PLCFx_Cp_FKP*)pPap->pPLCFx; } + WW8PLCFx_SEPX* GetSepPLCF() const + { return (WW8PLCFx_SEPX*)pSep->pPLCFx; } + WW8PLCFxDesc* GetPap() const { return pPap; } + bool TransferOpenSprms(std::stack<USHORT> &rStack); + void SeekPos( long nNewCp ); + void SaveAllPLCFx( WW8PLCFxSaveAll& rSave ) const; + void RestoreAllPLCFx( const WW8PLCFxSaveAll& rSave ); + WW8PLCFspecial* GetFdoa() const { return pFdoa; } + WW8PLCFspecial* GetTxbx() const { return pTxbx; } + WW8PLCFspecial* GetTxbxBkd() const { return pTxbxBkd; } + WW8PLCFspecial* GetMagicTables() const { return pMagicTables; } + WW8PLCFspecial* GetWkbPLCF() const { return pSubdocs; } + BYTE* GetExtendedAtrds() const { return pExtendedAtrds; } + ManTypes GetManType() const { return nManType; } + bool GetDoingDrawTextBox() const { return mbDoingDrawTextBox; } +}; + +struct WW8PLCFxSaveAll +{ + WW8PLCFxSave1 aS[WW8PLCFMan::MAN_ANZ_PLCF]; +}; + +#endif // !DUMP + +class WW8ScannerBase +{ +friend WW8PLCFx_PCDAttrs::WW8PLCFx_PCDAttrs(ww::WordVersion eVersion, + WW8PLCFx_PCD* pPLCFx_PCD, const WW8ScannerBase* pBase ); +friend WW8PLCFx_Cp_FKP::WW8PLCFx_Cp_FKP( SvStream*, SvStream*, SvStream*, + const WW8ScannerBase&, ePLCFT ); + +#ifndef DUMP +friend WW8PLCFMan::WW8PLCFMan(WW8ScannerBase*, ManTypes, long, bool); +friend class SwWw8ImplReader; +friend class SwWW8FltControlStack; +#endif + +private: + const WW8Fib* pWw8Fib; + WW8PLCFx_Cp_FKP* pChpPLCF; // Character-Attrs + WW8PLCFx_Cp_FKP* pPapPLCF; // Para-Attrs + WW8PLCFx_SEPX* pSepPLCF; // Section-Attrs + WW8PLCFx_SubDoc* pFtnPLCF; // Footnotes + WW8PLCFx_SubDoc* pEdnPLCF; // EndNotes + WW8PLCFx_SubDoc* pAndPLCF; // Anmerkungen + WW8PLCFx_FLD* pFldPLCF; // Fields in Main Text + WW8PLCFx_FLD* pFldHdFtPLCF; // Fields in Header / Footer + WW8PLCFx_FLD* pFldTxbxPLCF; // Fields in Textboxes in Main Text + WW8PLCFx_FLD* pFldTxbxHdFtPLCF; // Fields in Textboxes in Header / Footer + WW8PLCFx_FLD* pFldFtnPLCF; // Fields in Footnotes + WW8PLCFx_FLD* pFldEdnPLCF; // Fields in Endnotes + WW8PLCFx_FLD* pFldAndPLCF; // Fields in Anmerkungen + WW8PLCFspecial* pMainFdoa; // Graphic Primitives in Main Text + WW8PLCFspecial* pHdFtFdoa; // Graphic Primitives in Header / Footer + WW8PLCFspecial* pMainTxbx; // Textboxen in Main Text + WW8PLCFspecial* pMainTxbxBkd; // Break-Deskriptoren fuer diese + WW8PLCFspecial* pHdFtTxbx; // TextBoxen in Header / Footer + WW8PLCFspecial* pHdFtTxbxBkd; // Break-Deskriptoren fuer diese + WW8PLCFspecial* pMagicTables; // Break-Deskriptoren fuer diese + WW8PLCFspecial* pSubdocs; // subdoc references in master document + BYTE* pExtendedAtrds; // Extended ATRDs + WW8PLCFx_Book* pBook; // Bookmarks + + WW8PLCFpcd* pPiecePLCF; // fuer FastSave ( Basis-PLCF ohne Iterator ) + WW8PLCFpcd_Iter* pPieceIter; // fuer FastSave ( Iterator dazu ) + WW8PLCFx_PCD* pPLCFx_PCD; // dito + WW8PLCFx_PCDAttrs* pPLCFx_PCDAttrs; + BYTE** pPieceGrpprls; // Attribute an Piece-Table + UINT16 nPieceGrpprls; // Anzahl davon + + WW8PLCFpcd* OpenPieceTable( SvStream* pStr, const WW8Fib* pWwF ); + void DeletePieceTable(); +public: + WW8ScannerBase( SvStream* pSt, SvStream* pTblSt, SvStream* pDataSt, + const WW8Fib* pWwF ); + ~WW8ScannerBase(); + bool AreThereFootnotes() const { return pFtnPLCF->Count() > 0; }; + bool AreThereEndnotes() const { return pEdnPLCF->Count() > 0; }; + + //If you use WW8Fc2Cp you are almost certainly doing the wrong thing + //when it comes to fastsaved files, avoid like the plague. For export + //given that we never write fastsaved files you can use it, otherwise + //I will beat you with a stick + WW8_CP WW8Fc2Cp(WW8_FC nFcPos) const ; + WW8_FC WW8Cp2Fc(WW8_CP nCpPos, bool* pIsUnicode = 0, + WW8_CP* pNextPieceCp = 0, bool* pTestFlag = 0) const; + + xub_StrLen WW8ReadString(SvStream& rStrm, String& rStr, WW8_CP nAktStartCp, + long nTotalLen, rtl_TextEncoding eEnc ) const; + +}; + +/** FIB - the File Information Block + + The FIB contains a "magic word" and pointers to the various other parts of + the file, as well as information about the length of the file. + The FIB starts at the beginning of the file. +*/ +class WW8Fib +{ +public: + /** + Program-Version asked for by us: + in Ctor we check if it matches the value of nFib + + 6 == "WinWord 6 or WinWord 95", + 7 == "only WinWord 95" + 8 == "WinWord 97 or newer" + */ + BYTE nVersion; + /* + error status + */ + ULONG nFibError; + /* + vom Ctor aus dem FIB gelesene Daten + (entspricht nur ungefaehr der tatsaechlichen Struktur + des Winword-FIB) + */ + UINT16 wIdent; // 0x0 int magic number + /* + File Information Block (FIB) values: + WinWord 1.0 = 33 + WinWord 2.0 = 45 + WinWord 6.0c for 16bit = 101 + Word 6/32 bit = 104 + Word 95 = 104 + Word 97 = 193 + Word 2000 = 217 + Word 2002 = 257 + Word 2003 = 268 + Word 2007 = 274 + */ + UINT16 nFib; // 0x2 FIB version written + UINT16 nProduct; // 0x4 product version written by + INT16 lid; // 0x6 language stamp---localized version; + WW8_PN pnNext; // 0x8 + + UINT16 fDot :1; // 0xa 0001 + UINT16 fGlsy :1; + UINT16 fComplex :1; // 0004 when 1, file is in complex, fast-saved format. + UINT16 fHasPic :1; // 0008 file contains 1 or more pictures + UINT16 cQuickSaves :4; // 00F0 count of times file was quicksaved + UINT16 fEncrypted :1; //0100 1 if file is encrypted, 0 if not + UINT16 fWhichTblStm :1; //0200 When 0, this fib refers to the table stream + UINT16 fReadOnlyRecommended :1; + UINT16 fWriteReservation :1; + // named "0Table", when 1, this fib refers to the + // table stream named "1Table". Normally, a file + // will have only one table stream, but under unusual + // circumstances a file may have table streams with + // both names. In that case, this flag must be used + // to decide which table stream is valid. + + UINT16 fExtChar :1; // 1000 =1, when using extended character set in file + UINT16 fFarEast :1; // 4000 =1, probably, when far-East language vaiants of Word is used to create a file #i90932# + + UINT16 fObfuscated :1; // 8000=1. specifies whether the document is obfuscated using XOR obfuscation. otherwise this bit MUST be ignored. + + UINT16 nFibBack; // 0xc + UINT16 nHash; // 0xe file encrypted hash + UINT16 nKey; // 0x10 file encrypted key + UINT8 envr; // 0x12 environment in which file was created + // 0 created by Win Word / 1 created by Mac Word + BYTE fMac :1; // 0x13 when 1, this file was last saved in the Mac environment + BYTE fEmptySpecial :1; + BYTE fLoadOverridePage :1; + BYTE fFuturesavedUndo :1; + BYTE fWord97Saved :1; + BYTE fWord2000Saved :1; + BYTE :2; + + UINT16 chse; // 0x14 default extended character set id for text in document stream. (overidden by chp.chse) + // 0 = ANSI / 256 Macintosh character set. + UINT16 chseTables; // 0x16 default extended character set id for text in + // internal data structures: 0 = ANSI, 256 = Macintosh + WW8_FC fcMin; // 0x18 file offset of first character of text + WW8_FC fcMac; // 0x1c file offset of last character of text + 1 + + // Einschub fuer WW8 ***************************************************** + UINT16 csw; // Count of fields in the array of "shorts" + + // Marke: "rgsw" Beginning of the array of shorts + UINT16 wMagicCreated; // unique number Identifying the File's creator + // 0x6A62 is the creator ID for Word and is reserved. + // Other creators should choose a different value. + UINT16 wMagicRevised; // identifies the File's last modifier + UINT16 wMagicCreatedPrivate; // private data + UINT16 wMagicRevisedPrivate; // private data + /* + INT16 pnFbpChpFirst_W6; // not used + INT16 pnChpFirst_W6; // not used + INT16 cpnBteChp_W6; // not used + INT16 pnFbpPapFirst_W6; // not used + INT16 pnPapFirst_W6; // not used + INT16 cpnBtePap_W6; // not used + INT16 pnFbpLvcFirst_W6; // not used + INT16 pnLvcFirst_W6; // not used + INT16 cpnBteLvc_W6; // not used + */ + INT16 lidFE; // Language id if document was written by Far East version + // of Word (i.e. FIB.fFarEast is on) + UINT16 clw; // Number of fields in the array of longs + + // Ende des Einschubs fuer WW8 ******************************************* + + // Marke: "rglw" Beginning of the array of longs + WW8_FC cbMac; // 0x20 file offset of last byte written to file + 1. + + // WW8_FC u4[4]; // 0x24 + WW8_CP ccpText; // 0x34 length of main document text stream + WW8_CP ccpFtn; // 0x38 length of footnote subdocument text stream + WW8_CP ccpHdr; // 0x3c length of header subdocument text stream + WW8_CP ccpMcr; // 0x40 length of macro subdocument text stream + WW8_CP ccpAtn; // 0x44 length of annotation subdocument text stream + WW8_CP ccpEdn; // 0x48 length of endnote subdocument text stream + WW8_CP ccpTxbx; // 0x4c length of textbox subdocument text stream + WW8_CP ccpHdrTxbx; // 0x50 length of header textbox subdocument text stream + + // Einschub fuer WW8 ***************************************************** + INT32 pnFbpChpFirst; // when there was insufficient memory for Word to expand + // the PLCFbte at save time, the PLCFbte is written + // to the file in a linked list of 512-byte pieces + // starting with this pn. + /* + // folgende Felder existieren zwar so in der Datei, + // wir benutzen jedoch unten deklarierte General-Variablen + // fuer Ver67 und Ver8 gemeinsam. + INT32 pnChpFirst; // the page number of the lowest numbered page in the + // document that records CHPX FKP information + INT32 cpnBteChp; // count of CHPX FKPs recorded in file. In non-complex + // files if the number of entries in the PLCFbteChpx + // is less than this, the PLCFbteChpx is incomplete. + */ + INT32 pnFbpPapFirst; // when there was insufficient memory for Word to expand + // the PLCFbte at save time, the PLCFbte is written to + // the file in a linked list of 512-byte pieces + // starting with this pn + /* + // folgende Felder existieren zwar so in der Datei, + // wir benutzen jedoch unten deklarierte General-Variablen + // fuer Ver67 und Ver8 gemeinsam. + INT32 pnPapFirst; // the page number of the lowest numbered page in the + // document that records PAPX FKP information + INT32 cpnBtePap; // count of PAPX FKPs recorded in file. In non-complex + // files if the number of entries in the PLCFbtePapx is + // less than this, the PLCFbtePapx is incomplete. + */ + INT32 pnFbpLvcFirst; // when there was insufficient memory for Word to expand + // the PLCFbte at save time, the PLCFbte is written to + // the file in a linked list of 512-byte pieces + // starting with this pn + INT32 pnLvcFirst; // the page number of the lowest numbered page in the + // document that records LVC FKP information + INT32 cpnBteLvc; // count of LVC FKPs recorded in file. In non-complex + // files if the number of entries in the PLCFbtePapx is + // less than this, the PLCFbtePapx is incomplete. + INT32 fcIslandFirst; // ? + INT32 fcIslandLim; // ? + UINT16 cfclcb; // Number of fields in the array of FC/LCB pairs. + + // Ende des Einschubs fuer WW8 ******************************************* + + // Marke: "rgfclcb" Beginning of array of FC/LCB pairs. + WW8_FC fcStshfOrig; // file offset of original allocation for STSH in table + // stream. During fast save Word will attempt to reuse + // this allocation if STSH is small enough to fit. + INT32 lcbStshfOrig; // 0x5c count of bytes of original STSH allocation + WW8_FC fcStshf; // 0x60 file offset of STSH in file. + INT32 lcbStshf; // 0x64 count of bytes of current STSH allocation + WW8_FC fcPlcffndRef; // 0x68 file offset of footnote reference PLCF. + INT32 lcbPlcffndRef; // 0x6c count of bytes of footnote reference PLCF + // == 0 if no footnotes defined in document. + + WW8_FC fcPlcffndTxt; // 0x70 file offset of footnote text PLCF. + INT32 lcbPlcffndTxt; // 0x74 count of bytes of footnote text PLCF. + // == 0 if no footnotes defined in document + + WW8_FC fcPlcfandRef; // 0x78 file offset of annotation reference PLCF. + INT32 lcbPlcfandRef; // 0x7c count of bytes of annotation reference PLCF. + + WW8_FC fcPlcfandTxt; // 0x80 file offset of annotation text PLCF. + INT32 lcbPlcfandTxt; // 0x84 count of bytes of the annotation text PLCF + + WW8_FC fcPlcfsed; // 8x88 file offset of section descriptor PLCF. + INT32 lcbPlcfsed; // 0x8c count of bytes of section descriptor PLCF. + + WW8_FC fcPlcfpad; // 0x90 file offset of paragraph descriptor PLCF + INT32 lcbPlcfpad; // 0x94 count of bytes of paragraph descriptor PLCF. + // ==0 if file was never viewed in Outline view. + // Should not be written by third party creators + + WW8_FC fcPlcfphe; // 0x98 file offset of PLCF of paragraph heights. + INT32 lcbPlcfphe; // 0x9c count of bytes of paragraph height PLCF. + // ==0 when file is non-complex. + + WW8_FC fcSttbfglsy; // 0xa0 file offset of glossary string table. + INT32 lcbSttbfglsy; // 0xa4 count of bytes of glossary string table. + // == 0 for non-glossary documents. + // !=0 for glossary documents. + + WW8_FC fcPlcfglsy; // 0xa8 file offset of glossary PLCF. + INT32 lcbPlcfglsy; // 0xac count of bytes of glossary PLCF. + // == 0 for non-glossary documents. + // !=0 for glossary documents. + + WW8_FC fcPlcfhdd; // 0xb0 byte offset of header PLCF. + INT32 lcbPlcfhdd; // 0xb4 count of bytes of header PLCF. + // == 0 if document contains no headers + + WW8_FC fcPlcfbteChpx; // 0xb8 file offset of character property bin table.PLCF. + INT32 lcbPlcfbteChpx;// 0xbc count of bytes of character property bin table PLCF. + + WW8_FC fcPlcfbtePapx; // 0xc0 file offset of paragraph property bin table.PLCF. + INT32 lcbPlcfbtePapx;// 0xc4 count of bytes of paragraph property bin table PLCF. + + WW8_FC fcPlcfsea; // 0xc8 file offset of PLCF reserved for private use. The SEA is 6 bytes long. + INT32 lcbPlcfsea; // 0xcc count of bytes of private use PLCF. + + WW8_FC fcSttbfffn; // 0xd0 file offset of font information STTBF. See the FFN file structure definition. + INT32 lcbSttbfffn; // 0xd4 count of bytes in sttbfffn. + + WW8_FC fcPlcffldMom; // 0xd8 offset in doc stream to the PLCF of field positions in the main document. + INT32 lcbPlcffldMom; // 0xdc + + WW8_FC fcPlcffldHdr; // 0xe0 offset in doc stream to the PLCF of field positions in the header subdocument. + INT32 lcbPlcffldHdr; // 0xe4 + + WW8_FC fcPlcffldFtn; // 0xe8 offset in doc stream to the PLCF of field positions in the footnote subdocument. + INT32 lcbPlcffldFtn; // 0xec + + WW8_FC fcPlcffldAtn; // 0xf0 offset in doc stream to the PLCF of field positions in the annotation subdocument. + INT32 lcbPlcffldAtn; // 0xf4 + + WW8_FC fcPlcffldMcr; // 0xf8 offset in doc stream to the PLCF of field positions in the macro subdocument. + INT32 lcbPlcffldMcr; // 9xfc + + WW8_FC fcSttbfbkmk; // 0x100 offset in document stream of the STTBF that records bookmark names in the main document + INT32 lcbSttbfbkmk; // 0x104 + + WW8_FC fcPlcfbkf; // 0x108 offset in document stream of the PLCF that records the beginning CP offsets of bookmarks in the main document. See BKF + INT32 lcbPlcfbkf; // 0x10c + + WW8_FC fcPlcfbkl; // 0x110 offset in document stream of the PLCF that records the ending CP offsets of bookmarks recorded in the main document. See the BKL structure definition. + INT32 lcbPlcfbkl; // 0x114 INT32 + + WW8_FC fcCmds; // 0x118 FC + INT32 lcbCmds; // 0x11c + + WW8_FC fcPlcfmcr; // 0x120 FC + INT32 lcbPlcfmcr; // 0x124 + + WW8_FC fcSttbfmcr; // 0x128 FC + INT32 lcbSttbfmcr; // 0x12c + + WW8_FC fcPrDrvr; // 0x130 file offset of the printer driver information (names of drivers, port etc...) + INT32 lcbPrDrvr; // 0x134 count of bytes of the printer driver information (names of drivers, port etc...) + + WW8_FC fcPrEnvPort; // 0x138 file offset of the print environment in portrait mode. + INT32 lcbPrEnvPort; // 0x13c count of bytes of the print environment in portrait mode. + + WW8_FC fcPrEnvLand; // 0x140 file offset of the print environment in landscape mode. + INT32 lcbPrEnvLand; // 0x144 count of bytes of the print environment in landscape mode. + + WW8_FC fcWss; // 0x148 file offset of Window Save State data structure. See WSS. + INT32 lcbWss; // 0x14c count of bytes of WSS. ==0 if unable to store the window state. + + WW8_FC fcDop; // 0x150 file offset of document property data structure. + sal_uInt32 lcbDop; // 0x154 count of bytes of document properties. + // cbDOP is 84 when nFib < 103 + + + WW8_FC fcSttbfAssoc; // 0x158 offset to STTBF of associated strings. See STTBFASSOC. + INT32 lcbSttbfAssoc; // 0x15C + + WW8_FC fcClx; // 0x160 file offset of beginning of information for complex files. + INT32 lcbClx; // 0x164 count of bytes of complex file information. 0 if file is non-complex. + + WW8_FC fcPlcfpgdFtn; // 0x168 file offset of page descriptor PLCF for footnote subdocument. + INT32 lcbPlcfpgdFtn; // 0x16C count of bytes of page descriptor PLCF for footnote subdocument. + // ==0 if document has not been paginated. The length of the PGD is 8 bytes. + + WW8_FC fcAutosaveSource; // 0x170 file offset of the name of the original file. + INT32 lcbAutosaveSource; // 0x174 count of bytes of the name of the original file. + + WW8_FC fcGrpStAtnOwners; // 0x178 group of strings recording the names of the owners of annotations + INT32 lcbGrpStAtnOwners; // 0x17C count of bytes of the group of strings + + WW8_FC fcSttbfAtnbkmk; // 0x180 file offset of the sttbf that records names of bookmarks in the annotation subdocument + INT32 lcbSttbfAtnbkmk; // 0x184 length in bytes of the sttbf that records names of bookmarks in the annotation subdocument + + // Einschubs fuer WW67 *************************************************** + + // INT16 wSpare4Fib; // Reserve, muss hier nicht deklariert werden + + /* + // folgende Felder existieren zwar so in der Datei, + // wir benutzen jedoch unten deklarierte General-Variablen + // fuer Ver67 und Ver8 gemeinsam. + WW8_PN pnChpFirst; // the page number of the lowest numbered page in + // the document that records CHPX FKP information + WW8_PN pnPapFirst; // the page number of the lowest numbered page in + // the document that records PAPX FKP information + + WW8_PN cpnBteChp; // count of CHPX FKPs recorded in file. In non-complex + // files if the number of entries in the PLCFbteChpx is + // less than this, the PLCFbteChpx is incomplete. + WW8_PN cpnBtePap; // count of PAPX FKPs recorded in file. In non-complex + // files if the number of entries in the PLCFbtePapx is + // less than this, the PLCFbtePapx is incomplete. + */ + + // Ende des Einschubs fuer WW67 ****************************************** + + WW8_FC fcPlcfdoaMom; // 0x192 file offset of the FDOA (drawn object) PLCF for main document. + // ==0 if document has no drawn objects. The length of the FDOA is 6 bytes. + // ab Ver8 unused + INT32 lcbPlcfdoaMom; // 0x196 length in bytes of the FDOA PLCF of the main document + // ab Ver8 unused + WW8_FC fcPlcfdoaHdr; // 0x19A file offset of the FDOA (drawn object) PLCF for the header document. + // ==0 if document has no drawn objects. The length of the FDOA is 6 bytes. + // ab Ver8 unused + INT32 lcbPlcfdoaHdr; // 0x19E length in bytes of the FDOA PLCF of the header document + // ab Ver8 unused + + WW8_FC fcPlcfspaMom; // offset in table stream of the FSPA PLCF for main document. + // == 0 if document has no office art objects + // war in Ver67 nur leere Reserve + INT32 lcbPlcfspaMom; // length in bytes of the FSPA PLCF of the main document + // war in Ver67 nur leere Reserve + WW8_FC fcPlcfspaHdr; // offset in table stream of the FSPA PLCF for header document. + // == 0 if document has no office art objects + // war in Ver67 nur leere Reserve + INT32 lcbPlcfspaHdr; // length in bytes of the FSPA PLCF of the header document + // war in Ver67 nur leere Reserve + + WW8_FC fcPlcfAtnbkf; // 0x1B2 file offset of BKF (bookmark first) PLCF of the annotation subdocument + INT32 lcbPlcfAtnbkf; // 0x1B6 length in bytes of BKF (bookmark first) PLCF of the annotation subdocument + + WW8_FC fcPlcfAtnbkl; // 0x1BA file offset of BKL (bookmark last) PLCF of the annotation subdocument + INT32 lcbPlcfAtnbkl; // 0x1BE length in bytes of BKL (bookmark first) PLCF of the annotation subdocument + + WW8_FC fcPms; // 0x1C2 file offset of PMS (Print Merge State) information block + INT32 lcbPMS; // 0x1C6 length in bytes of PMS + + WW8_FC fcFormFldSttbf; // 0x1CA file offset of form field Sttbf which contains strings used in form field dropdown controls + INT32 lcbFormFldSttbf; // 0x1CE length in bytes of form field Sttbf + + WW8_FC fcPlcfendRef; // 0x1D2 file offset of PLCFendRef which points to endnote references in the main document stream + INT32 lcbPlcfendRef; // 0x1D6 + + WW8_FC fcPlcfendTxt; // 0x1DA file offset of PLCFendRef which points to endnote text in the endnote document + // stream which corresponds with the PLCFendRef + INT32 lcbPlcfendTxt; // 0x1DE + + WW8_FC fcPlcffldEdn; // 0x1E2 offset to PLCF of field positions in the endnote subdoc + INT32 lcbPlcffldEdn; // 0x1E6 + + WW8_FC fcPlcfpgdEdn; // 0x1EA offset to PLCF of page boundaries in the endnote subdoc. + INT32 lcbPlcfpgdEdn; // 0x1EE + + + WW8_FC fcDggInfo; // offset in table stream of the office art object table data. + // The format of office art object table data is found in a separate document. + // war in Ver67 nur leere Reserve + INT32 lcbDggInfo; // length in bytes of the office art object table data + // war in Ver67 nur leere Reserve + + WW8_FC fcSttbfRMark; // 0x1fa offset to STTBF that records the author abbreviations... + INT32 lcbSttbfRMark; // 0x1fe + WW8_FC fcSttbfCaption; // 0x202 offset to STTBF that records caption titles... + INT32 lcbSttbfCaption; // 0x206 + WW8_FC fcSttbAutoCaption; // offset in table stream to the STTBF that records the object names and + // indices into the caption STTBF for objects which get auto captions. + INT32 lcbSttbAutoCaption; // 0x20e + + WW8_FC fcPlcfwkb; // 0x212 offset to PLCF that describes the boundaries of contributing documents... + INT32 lcbPlcfwkb; // 0x216 + + WW8_FC fcPlcfspl; // offset in table stream of PLCF (of SPLS structures) that records spell check state + // war in Ver67 nur leere Reserve + INT32 lcbPlcfspl; // war in Ver67 nur leere Reserve + + WW8_FC fcPlcftxbxTxt; // 0x222 ...PLCF of beginning CP in the text box subdoc + INT32 lcbPlcftxbxTxt; // 0x226 + WW8_FC fcPlcffldTxbx; // 0x22a ...PLCF of field boundaries recorded in the textbox subdoc. + INT32 lcbPlcffldTxbx; // 0x22e + WW8_FC fcPlcfHdrtxbxTxt;// 0x232 ...PLCF of beginning CP in the header text box subdoc + INT32 lcbPlcfHdrtxbxTxt;// 0x236 + WW8_FC fcPlcffldHdrTxbx;// 0x23a ...PLCF of field boundaries recorded in the header textbox subdoc. + INT32 lcbPlcffldHdrTxbx;// 0x23e + WW8_FC fcStwUser; + sal_uInt32 lcbStwUser; + WW8_FC fcSttbttmbd; + sal_uInt32 lcbSttbttmbd; + + WW8_FC fcSttbFnm; // 0x02da offset in the table stream of masters subdocument names + INT32 lcbSttbFnm; // 0x02de length + + /* + spezielle Listenverwaltung fuer WW8 + */ + WW8_FC fcPlcfLst; // 0x02e2 offset in the table stream of list format information. + INT32 lcbPlcfLst; // 0x02e6 length + WW8_FC fcPlfLfo; // 0x02ea offset in the table stream of list format override information. + INT32 lcbPlfLfo; // 0x02ee length + /* + spezielle Break-Verwaltung fuer Text-Box-Stories in WW8 + */ + WW8_FC fcPlcftxbxBkd; // 0x02f2 PLCF fuer TextBox-Break-Deskriptoren im Maintext + INT32 lcbPlcftxbxBkd; // 0x02f6 + WW8_FC fcPlcfHdrtxbxBkd;// 0x02fa PLCF fuer TextBox-Break-Deskriptoren im Header-/Footer-Bereich + INT32 lcbPlcfHdrtxbxBkd;// 0x02fe + + // 0x302 - 372 == ignore + /* + ListNames (skip to here!) + */ + WW8_FC fcSttbListNames;// 0x0372 PLCF for Listname Table + INT32 lcbSttbListNames;// 0x0376 + + WW8_FC fcPlcfTch; + INT32 lcbPlcfTch; + + // 0x38A - 41A == ignore + WW8_FC fcAtrdExtra; + UINT32 lcbAtrdExtra; + + // 0x422 - 0x4D4 == ignore + WW8_FC fcHplxsdr; //bizarrely, word xp seems to require this set to shows dates from AtrdExtra + UINT32 lcbHplxsdr; + + /* + General-Varaiblen, die fuer Ver67 und Ver8 verwendet werden, + obwohl sie in der jeweiligen DATEI verschiedene Groesse haben: + */ + INT32 pnChpFirst; + INT32 pnPapFirst; + INT32 cpnBteChp; + INT32 cpnBtePap; + /* + The actual nFib, moved here because some readers assumed + they couldn't read any format with nFib > some constant + */ + UINT16 nFib_actual; // 0x05bc #i56856# + /* + nun wird lediglich noch ein Ctor benoetigt + */ + WW8Fib( SvStream& rStrm, BYTE nWantedVersion,UINT32 nOffset=0 ); + + /* leider falsch, man braucht auch noch einen fuer den Export */ + WW8Fib( BYTE nVersion = 6 ); + bool WriteHeader(SvStream& rStrm); + bool Write(SvStream& rStrm); + static rtl_TextEncoding GetFIBCharset(UINT16 chs); + ww::WordVersion GetFIBVersion() const; + WW8_CP GetBaseCp(ManTypes nType) const; +}; + +class WW8Style +{ +protected: + WW8Fib& rFib; + SvStream& rSt; + long nStyleStart; + long nStyleLen; + + UINT16 cstd; // Count of styles in stylesheet + UINT16 cbSTDBaseInFile; // Length of STD Base as stored in a file + UINT16 fStdStylenamesWritten : 1; // Are built-in stylenames stored? + UINT16 : 15; // Spare flags + UINT16 stiMaxWhenSaved; // Max sti known when file was written + UINT16 istdMaxFixedWhenSaved; // How many fixed-index istds are there? + UINT16 nVerBuiltInNamesWhenSaved; // Current version of built-in stylenames + // ftc used by StandardChpStsh for this document + UINT16 ftcStandardChpStsh; + // CJK ftc used by StandardChpStsh for this document + UINT16 ftcStandardChpCJKStsh; + // CTL ftc used by StandardChpStsh for this document + UINT16 ftcStandardChpCTLStsh; + + //No copying + WW8Style(const WW8Style&); + WW8Style& operator=(const WW8Style&); +public: + WW8Style( SvStream& rSt, WW8Fib& rFibPara ); + WW8_STD* Read1STDFixed( short& rSkip, short* pcbStd ); + WW8_STD* Read1Style( short& rSkip, String* pString, short* pcbStd ); + UINT16 GetCount() const { return cstd; } +}; + +class WW8Fonts +{ +protected: + WW8_FFN* pFontA; // Array of Pointers to Font Description + USHORT nMax; // Array-Size +public: + WW8Fonts( SvStream& rSt, WW8Fib& rFib ); + ~WW8Fonts() { delete[] pFontA; } + const WW8_FFN* GetFont( USHORT nNum ) const; + USHORT GetMax() const { return nMax; } +}; + +typedef BYTE HdFtFlags; +namespace nsHdFtFlags +{ + const HdFtFlags WW8_HEADER_EVEN = 0x01; + const HdFtFlags WW8_HEADER_ODD = 0x02; + const HdFtFlags WW8_FOOTER_EVEN = 0x04; + const HdFtFlags WW8_FOOTER_ODD = 0x08; + const HdFtFlags WW8_HEADER_FIRST = 0x10; + const HdFtFlags WW8_FOOTER_FIRST = 0x20; +} + +/// Document Properties +class WW8Dop +{ +public: + /* Error Status */ + ULONG nDopError; + /* + Corresponds only roughly to the actual structure of the Winword DOP, + the winword FIB version matters to what exists. + */ + // Initialisier-Dummy: + BYTE nDataStart; + //------------------------- + UINT16 fFacingPages : 1; // 1 when facing pages should be printed + UINT16 fWidowControl : 1; // 1 when widow control is in effect. 0 when widow control disabled. + UINT16 fPMHMainDoc : 1; // 1 when doc is a main doc for Print Merge Helper, 0 when not; default=0 + UINT16 grfSuppression : 2; // 0 Default line suppression storage; 0= form letter line suppression; 1= no line suppression; default=0 + UINT16 fpc : 2; // 1 footnote position code: 0 as endnotes, 1 at bottom of page, 2 immediately beneath text + UINT16 : 1; // 0 unused + //------------------------- + UINT16 grpfIhdt : 8; // 0 specification of document headers and footers. See explanation under Headers and Footers topic. + //------------------------- + UINT16 rncFtn : 2; // 0 restart index for footnotes, 0 don't restart note numbering, 1 section, 2 page + UINT16 nFtn : 14; // 1 initial footnote number for document + UINT16 fOutlineDirtySave : 1; // when 1, indicates that information in the hPLCFpad should be refreshed since outline has been dirtied + UINT16 : 7; // reserved + UINT16 fOnlyMacPics : 1; // when 1, Word believes all pictures recorded in the document were created on a Macintosh + UINT16 fOnlyWinPics : 1; // when 1, Word believes all pictures recorded in the document were created in Windows + UINT16 fLabelDoc : 1; // when 1, document was created as a print merge labels document + UINT16 fHyphCapitals : 1; // when 1, Word is allowed to hyphenate words that are capitalized. When 0, capitalized may not be hyphenated + UINT16 fAutoHyphen : 1; // when 1, Word will hyphenate newly typed text as a background task + UINT16 fFormNoFields : 1; + UINT16 fLinkStyles : 1; // when 1, Word will merge styles from its template + UINT16 fRevMarking : 1; // when 1, Word will mark revisions as the document is edited + UINT16 fBackup : 1; // always make backup when document saved when 1. + UINT16 fExactCWords : 1; + UINT16 fPagHidden : 1; // + UINT16 fPagResults : 1; + UINT16 fLockAtn : 1; // when 1, annotations are locked for editing + UINT16 fMirrorMargins : 1; // swap margins on left/right pages when 1. + UINT16 fReadOnlyRecommended : 1;// user has recommended that this doc be opened read-only when 1 + UINT16 fDfltTrueType : 1; // when 1, use TrueType fonts by default (flag obeyed only when doc was created by WinWord 2.x) + UINT16 fPagSuppressTopSpacing : 1;//when 1, file created with SUPPRESSTOPSPACING=YES in win.ini. (flag obeyed only when doc was created by WinWord 2.x). + UINT16 fProtEnabled : 1; // when 1, document is protected from edit operations + UINT16 fDispFormFldSel : 1;// when 1, restrict selections to occur only within form fields + UINT16 fRMView : 1; // when 1, show revision markings on screen + UINT16 fRMPrint : 1; // when 1, print revision marks when document is printed + UINT16 fWriteReservation : 1; + UINT16 fLockRev : 1; // when 1, the current revision marking state is locked + UINT16 fEmbedFonts : 1; // when 1, document contains embedded True Type fonts + // compatability options + UINT16 copts_fNoTabForInd : 1; // when 1, don�t add automatic tab stops for hanging indent + UINT16 copts_fNoSpaceRaiseLower : 1; // when 1, don�t add extra space for raised or lowered characters + UINT16 copts_fSupressSpbfAfterPgBrk : 1; // when 1, supress the paragraph Space Before and Space After options after a page break + UINT16 copts_fWrapTrailSpaces : 1; // when 1, wrap trailing spaces at the end of a line to the next line + UINT16 copts_fMapPrintTextColor : 1; // when 1, print colors as black on non-color printers + UINT16 copts_fNoColumnBalance : 1; // when 1, don�t balance columns for Continuous Section starts + UINT16 copts_fConvMailMergeEsc : 1; + UINT16 copts_fSupressTopSpacing : 1; // when 1, supress extra line spacing at top of page + UINT16 copts_fOrigWordTableRules : 1; // when 1, combine table borders like Word 5.x for the Macintosh + UINT16 copts_fTransparentMetafiles : 1; // when 1, don�t blank area between metafile pictures + UINT16 copts_fShowBreaksInFrames : 1; // when 1, show hard page or column breaks in frames + UINT16 copts_fSwapBordersFacingPgs : 1; // when 1, swap left and right pages on odd facing pages + UINT16 copts_fExpShRtn : 1; // when 1, expand character spaces on the line ending SHIFT+RETURN // #i56856# + + INT16 dxaTab; // 720 twips default tab width + UINT16 wSpare; // + UINT16 dxaHotZ; // width of hyphenation hot zone measured in twips + UINT16 cConsecHypLim; // number of lines allowed to have consecutive hyphens + UINT16 wSpare2; // reserved + INT32 dttmCreated; // DTTM date and time document was created + INT32 dttmRevised; // DTTM date and time document was last revised + INT32 dttmLastPrint; // DTTM date and time document was last printed + INT16 nRevision; // number of times document has been revised since its creation + INT32 tmEdited; // time document was last edited + INT32 cWords; // count of words tallied by last Word Count execution + INT32 cCh; // count of characters tallied by last Word Count execution + INT16 cPg; // count of pages tallied by last Word Count execution + INT32 cParas; // count of paragraphs tallied by last Word Count execution + UINT16 rncEdn : 2; // restart endnote number code: 0 don�t restart endnote numbering, 1 section, 2 page + UINT16 nEdn : 14; // beginning endnote number + UINT16 epc : 2; // endnote position code: 0 at end of section, 3 at end of document + // UINT16 nfcFtnRef : 4; // number format code for auto footnotes: 0 Arabic, 1 Upper case Roman, 2 Lower case Roman + // 3 Upper case Letter, 4 Lower case Letter + // ersetzt durch gleichlautendes Feld unten + // UINT16 nfcEdnRef : 4; // number format code for auto endnotes: 0 Arabic, 1 Upper case Roman, 2 Lower case Roman + // 3 Upper case Letter, 4 Lower case Letter + // ersetzt durch gleichlautendes Feld unten + UINT16 fPrintFormData : 1; // only print data inside of form fields + UINT16 fSaveFormData : 1; // only save document data that is inside of a form field. + UINT16 fShadeFormData : 1; // shade form fields + UINT16 : 2; // reserved + UINT16 fWCFtnEdn : 1; // when 1, include footnotes and endnotes in word count + INT32 cLines; // count of lines tallied by last Word Count operation + INT32 cWordsFtnEnd; // count of words in footnotes and endnotes tallied by last Word Count operation + INT32 cChFtnEdn; // count of characters in footnotes and endnotes tallied by last Word Count operation + INT16 cPgFtnEdn; // count of pages in footnotes and endnotes tallied by last Word Count operation + INT32 cParasFtnEdn; // count of paragraphs in footnotes and endnotes tallied by last Word Count operation + INT32 cLinesFtnEdn; // count of paragraphs in footnotes and endnotes tallied by last Word Count operation + INT32 lKeyProtDoc; // document protection password key, only valid if dop.fProtEnabled, dop.fLockAtn or dop.fLockRev are 1. + UINT16 wvkSaved : 3; // document view kind: 0 Normal view, 1 Outline view, 2 Page View + UINT16 wScaleSaved : 9; // + UINT16 zkSaved : 2; + UINT16 fRotateFontW6 : 1; + UINT16 iGutterPos : 1 ; + + // hier sollte bei nFib < 103 Schluss sein, sonst ist Datei fehlerhaft! + + /* + bei nFib >= 103 gehts weiter: + */ + UINT32 fNoTabForInd :1; // see above in compatability options + UINT32 fNoSpaceRaiseLower :1; // see above + UINT32 fSupressSpbfAfterPageBreak :1; // see above + UINT32 fWrapTrailSpaces :1; // see above + UINT32 fMapPrintTextColor :1; // see above + UINT32 fNoColumnBalance :1; // see above + UINT32 fConvMailMergeEsc :1; // see above + UINT32 fSupressTopSpacing :1; // see above + UINT32 fOrigWordTableRules :1; // see above + UINT32 fTransparentMetafiles :1; // see above + UINT32 fShowBreaksInFrames :1; // see above + UINT32 fSwapBordersFacingPgs :1; // see above + UINT32 fCompatabilityOptions_Unknown1_13 :1; // #i78591# + UINT32 fExpShRtn :1; // #i78591# and #i56856# + UINT32 fCompatabilityOptions_Unknown1_15 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_16 :1; // #i78591# + UINT32 fSuppressTopSpacingMac5 :1; // Suppress extra line spacing at top + // of page like MacWord 5.x + UINT32 fTruncDxaExpand :1; // Expand/Condense by whole number of points + UINT32 fPrintBodyBeforeHdr :1; // Print body text before header/footer + UINT32 fNoLeading :1; // Don't add extra spacebetween rows of text + UINT32 fCompatabilityOptions_Unknown1_21 :1; // #i78591# + UINT32 fMWSmallCaps : 1; // Use larger small caps like MacWord 5.x + UINT32 fCompatabilityOptions_Unknown1_23 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_24 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_25 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_26 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_27 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_28 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_29 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_30 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown1_31 :1; // #i78591# + UINT32 fUsePrinterMetrics : 1; //The magic option + + // hier sollte bei nFib <= 105 Schluss sein, sonst ist Datei fehlerhaft! + + /* + bei nFib > 105 gehts weiter: + */ + INT16 adt; // Autoformat Document Type: + // 0 for normal. + // 1 for letter, and + // 2 for email. + WW8DopTypography doptypography; // see WW8STRUC.HXX + WW8_DOGRID dogrid; // see WW8STRUC.HXX + UINT16 :1; // reserved + UINT16 lvl :4; // Which outline levels are showing in outline view + UINT16 :4; // reserved + UINT16 fHtmlDoc :1; // This file is based upon an HTML file + UINT16 :1; // reserved + UINT16 fSnapBorder :1; // Snap table and page borders to page border + UINT16 fIncludeHeader :1; // Place header inside page border + UINT16 fIncludeFooter :1; // Place footer inside page border + UINT16 fForcePageSizePag :1; // Are we in online view + UINT16 fMinFontSizePag :1; // Are we auto-promoting fonts to >= hpsZoonFontPag? + UINT16 fHaveVersions :1; // versioning is turned on + UINT16 fAutoVersion :1; // autoversioning is enabled + UINT16 : 14; // reserved + // Skip 12 Bytes here: ASUMI + INT32 cChWS; + INT32 cChWSFtnEdn; + INT32 grfDocEvents; + // Skip 4+30+8 Bytes here + INT32 cDBC; + INT32 cDBCFtnEdn; + // Skip 4 Bytes here + INT16 nfcFtnRef; + INT16 nfcEdnRef; + INT16 hpsZoonFontPag; + INT16 dywDispPag; + + UINT32 fCompatabilityOptions_Unknown2_1 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_2 :1; // #i78591# + UINT32 fDontUseHTMLAutoSpacing:1; + UINT32 fCompatabilityOptions_Unknown2_4 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_5 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_6 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_7 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_8 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_9 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_10 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_11 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_12 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_13 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_14 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_15 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_16 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_17 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_18 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_19 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_20 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_21 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_22 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_23 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_24 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_25 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_26 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_27 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_28 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_29 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_30 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_31 :1; // #i78591# + UINT32 fCompatabilityOptions_Unknown2_32 :1; // #i78591# + + UINT16 fUnknown3:15; + UINT16 fUseBackGroundInAllmodes:1; + + UINT16 fDoNotEmbedSystemFont:1; + UINT16 fWordCompat:1; + UINT16 fLiveRecover:1; + UINT16 fEmbedFactoids:1; + UINT16 fFactoidXML:1; + UINT16 fFactoidAllDone:1; + UINT16 fFolioPrint:1; + UINT16 fReverseFolio:1; + UINT16 iTextLineEnding:3; + UINT16 fHideFcc:1; + UINT16 fAcetateShowMarkup:1; + UINT16 fAcetateShowAtn:1; + UINT16 fAcetateShowInsDel:1; + UINT16 fAcetateShowProps:1; + + // 2. Initialisier-Dummy: + BYTE nDataEnd; + + bool bUseThaiLineBreakingRules; + + /* Constructor for importing, needs to know the version of word used */ + WW8Dop(SvStream& rSt, INT16 nFib, INT32 nPos, sal_uInt32 nSize); + + /* Constructs default DOP suitable for exporting */ + WW8Dop(); + bool Write(SvStream& rStrm, WW8Fib& rFib) const; +public: + UINT32 GetCompatabilityOptions() const; + void SetCompatabilityOptions(UINT32 a32Bit); + // i#78591# + UINT32 GetCompatabilityOptions2() const; + void SetCompatabilityOptions2(UINT32 a32Bit); +}; + +class WW8PLCF_HdFt +{ +private: + WW8PLCF aPLCF; + long nTextOfs; + short nIdxOffset; +public: + WW8PLCF_HdFt( SvStream* pSt, WW8Fib& rFib, WW8Dop& rDop ); + bool GetTextPos(BYTE grpfIhdt, BYTE nWhich, WW8_CP& rStart, long& rLen); + bool GetTextPosExact(short nIdx, WW8_CP& rStart, long& rLen); + void UpdateIndex( BYTE grpfIhdt ); +}; + +void SwapQuotesInField(String &rFmt); + +Word2CHPX ReadWord2Chpx(SvStream &rSt, sal_Size nOffset, sal_uInt8 nSize); +std::vector<BYTE> ChpxToSprms(const Word2CHPX &rChpx); + +ULONG SafeReadString(ByteString &rStr,USHORT nLen,SvStream &rStrm); + +//MS has a (slightly) inaccurate view of how many twips +//are in the default letter size of a page +const USHORT lLetterWidth = 12242; +const USHORT lLetterHeight = 15842; + +#endif + +/* vi:set tabstop=4 shiftwidth=4 expandtab: */ |