/* * (c) Copyright Ascensio System SIA 2010-2023 * * This program is a free software product. You can redistribute it and/or * modify it under the terms of the GNU Affero General Public License (AGPL) * version 3 as published by the Free Software Foundation. In accordance with * Section 7(a) of the GNU AGPL its Section 15 shall be amended to the effect * that Ascensio System SIA expressly excludes the warranty of non-infringement * of any third-party rights. * * This program is distributed WITHOUT ANY WARRANTY; without even the implied * warranty of MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. For * details, see the GNU AGPL at: http://www.gnu.org/licenses/agpl-3.0.html * * You can contact Ascensio System SIA at 20A-6 Ernesta Birznieka-Upish * street, Riga, Latvia, EU, LV-1050. * * The interactive user interfaces in modified source and object code versions * of the Program must display Appropriate Legal Notices, as required under * Section 5 of the GNU AGPL version 3. * * Pursuant to Section 7(b) of the License you must retain the original Product * logo when distributing the program. Pursuant to Section 7(e) we decline to * grant you any rights under trademark law for use of our trademarks. * * All the Product's GUI elements, including illustrations and icon sets, as * well as technical writing content are licensed under the terms of the * Creative Commons Attribution-ShareAlike 4.0 International. See the License * terms at http://creativecommons.org/licenses/by-sa/4.0/legalcode * */ #pragma once #include "StructuredStorageReader.h" #include "FileInformationBlock.h" #include "PieceTable.h" #include "StringTable.h" #include "FontFamilyName.h" #include "WideString.h" #include "Plex.h" #include "AnnotationReferenceDescriptor.h" #include "Tbkd.h" #include "Spa.h" #include "SectionDescriptor.h" #include "SectionPropertyExceptions.h" #include "BookmarkFirst.h" #include "StyleSheet.h" #include "FormattedDiskPagePAPX.h" #include "FormattedDiskPageCHPX.h" #include "ListTable.h" #include "AnnotationOwnerList.h" #include "DocumentProperties.h" #include "EncryptionHeader.h" #include "ListFormatOverrideTable.h" #include "OfficeArtContent.h" #include "HeaderAndFooterTable.h" #include "FootnoteDescriptor.h" #include "EndnoteDescriptor.h" #include "FieldCharacter.h" #include "IVisitable.h" #include "../../Common/MS-LCID.h" #include "../../Common/cfcpp/compoundfile.h" namespace CRYPT { class Decryptor; } namespace DocFileFormat { class WordDocument : public IVisitable { friend class FootnotesMapping; friend class EndnotesMapping; friend class CommentsMapping; friend class Converter; friend class CharacterPropertiesMapping; friend class DocumentMapping; friend class MainDocumentMapping; friend class NumberingMapping; friend class ParagraphPropertiesMapping; friend class StyleSheetMapping; friend class HeaderMapping; friend class FooterMapping; friend class SectionPropertiesMapping; friend class Table; friend class TableRow; friend class VMLShapeMapping; friend class VMLPictureMapping; friend class OpenXmlPackage; friend class TextboxMapping; friend class SettingsMapping; friend class WordprocessingDocument; public: WordDocument(const std::wstring& tempFolder, const int userLCID); virtual ~WordDocument(); _UINT32 LoadDocument(const std::wstring& fileName, const std::wstring& password); int nWordVersion; int nDocumentCodePage; bool bDocumentCodePage; int nFontsCodePage; int nDocumentCodePageInfo; bool bErrorFile = false; inline StructuredStorageReader* GetStorage() const { return m_pStorage; } inline POLE::Stream* GetDocumentStream() const { return WordDocumentStream; } private: bool LoadDocumentFlat(); bool DecryptOfficeFile(CRYPT::Decryptor* Decryptor); bool DecryptStream(std::wstring streamName_open, POLE::Storage* storageIn, std::wstring streamName_create, std::shared_ptr storageOut, CRYPT::Decryptor* Decryptor, bool bDecrypt); void DecryptStream(int level, std::wstring streamName, POLE::Storage* storageIn, std::shared_ptr storageOut, CRYPT::Decryptor* Decryptor); inline OfficeArtContent* GetOfficeArt() { return officeArtContent; } inline int FindFileCharPos(int cp) { if (FIB->m_FibBase.fComplex) { if (!m_PieceTable) return -1; if ((!m_PieceTable->FileCharacterPositions) || (m_PieceTable->FileCharacterPositions->empty())) return -1; std::map::iterator it = m_PieceTable->FileCharacterPositions->find(cp); return (it != m_PieceTable->FileCharacterPositions->end()) ? it->second : -1; } else { int fc = cp + FIB->m_FibBase.fcMin; if (fc > FIB->m_FibBase.fcMac) return -1; return fc; } } std::vector* GetEncodingChars(int fcStart, int fcEnd); std::vector* GetChars(int fcStart, int fcEnd, int cp); std::vector* GetFileCharacterPositions(int fcMin, int fcMax); std::vector* GetCharacterPropertyExceptions(int fcMin, int fcMax); void Clear(); MS_LCID_converter m_lcidConverter; std::wstring m_sFileName; std::wstring m_sPassword; std::wstring m_sTempFolder; std::wstring m_sTempDecryptFileName; int m_nUserLCID; std::wstring m_sXmlApp; std::wstring m_sXmlCore; POLE::Stream* WordDocumentStream; // The stream "WordDocument" POLE::Stream* TableStream; // The stream "0Table" or "1Table" POLE::Stream* DataStream; // The stream called "Data" StructuredStorageReader* m_pStorage; //POLE::Storage* Storage std::vector* Text; // All text of the Word document std::vector* AllPapxFkps; // A list of all FKPs that contain PAPX std::vector* AllChpxFkps; // A list of all FKPs that contain CHPX std::map* AllPapx; // The value is the PAPX that formats the paragraph. std::map* AllSepx; // The value is the SEPX that formats the section. std::vector* AllPapxVector;// A vector to quick find in AllPapx std::map PictureBulletsCPsMap; std::map m_mapBadCP; struct _bmkStartEnd { int start; int end; _UINT32 bookmarkId; }; std::vector<_bmkStartEnd> BookmarkStartEndCPs; std::vector<_bmkStartEnd> BookmarkProtStartEndCPs; std::vector<_bmkStartEnd> AnnotStartEndCPs; std::map mapAnnotBookmarks; //id, index std::map mapProtBookmarks; FileInformationBlock* FIB; StyleSheet* Styles; // The style sheet of the document PieceTable* m_PieceTable; // PieceTable PieceTable; ListFormatOverrideTable* listFormatOverrideTable; // lists and numberings in the document. HeaderAndFooterTable* headerAndFooterTable; AnnotationOwnerList* AnnotationOwners; ListTable* listTable; // list numberings in the document. WordDocumentProperties* DocProperties; EncryptionHeader* encryptionHeader; OfficeArtContent* officeArtContent; // info about the drawings in the document. StringTable* RevisionAuthorTable; StringTable* FontTable; // A list of all font names, used in the doucument StringTable* BookmarkNames; StringTable* AutoTextNames; StringTable* AssocNames; StringTable* BkmkAnnotNames; StringTable* Captions; StringTable* AutoCaptions; StringTableEx* BkmkProt; StringTable* BkmkProtUser; Plex* IndividualFootnotesPlex; //A plex of locations of individual footnotes Plex* FootnoteReferenceCharactersPlex; //A plex of footnote reference characters Plex* IndividualEndnotesPlex; //A plex of locations of individual endnotes Plex* EndnoteReferenceCharactersPlex; //A plex of endnote reference characters Plex* HeaderStoriesPlex; //A plex of the header document Plex* IndividualCommentsPlex; // A plex with all ATRDPre10 structs Plex* TextboxIndividualPlex; Plex* TextboxBreakPlex; // Describes the breaks inside the textbox subdocument Plex* TextboxBreakPlexHeader; // Describes the breaks inside the header textbox subdocument Plex* OutlineListDescriptorPlex; Plex* OfficeDrawingPlex; Plex* OfficeDrawingPlexHeader; Plex* SectionPlex; Plex* BookmarkStartPlex; Plex* BookmarkEndPlex; Plex* AnnotStartPlex; Plex* AnnotEndPlex; Plex* BookmarkProtStartPlex; Plex* BookmarkProtEndPlex; Plex* ListPlex; Plex* FieldsPlex; Plex* FootnoteDocumentFieldsPlex; Plex* EndnoteDocumentFieldsPlex; Plex* HeadersAndFootersDocumentFieldsPlex; Plex* AnnotationsFieldsPlex; Plex* AnnotationsReferencePlex; Plex* AutoTextPlex; AnnotationReferenceExDescriptors* AnnotationsReferencesEx; //------------------------------------------------------------------------------ void CorrectColor(ODRAW::OfficeArtCOLORREF& color, int base_color, int type = 1); //fill, back, shadow, text, border }; }