WPParser.hxx
Go to the documentation of this file.
00001 /* -*- Mode: C++; c-default-style: "k&r"; indent-tabs-mode: nil; tab-width: 2; c-basic-offset: 2 -*- */
00002 
00003 /* libmwaw
00004 * Version: MPL 2.0 / LGPLv2+
00005 *
00006 * The contents of this file are subject to the Mozilla Public License Version
00007 * 2.0 (the "License"); you may not use this file except in compliance with
00008 * the License or as specified alternatively below. You may obtain a copy of
00009 * the License at http://www.mozilla.org/MPL/
00010 *
00011 * Software distributed under the License is distributed on an "AS IS" basis,
00012 * WITHOUT WARRANTY OF ANY KIND, either express or implied. See the License
00013 * for the specific language governing rights and limitations under the
00014 * License.
00015 *
00016 * Major Contributor(s):
00017 * Copyright (C) 2002 William Lachance (wrlach@gmail.com)
00018 * Copyright (C) 2002,2004 Marc Maurer (uwog@uwog.net)
00019 * Copyright (C) 2004-2006 Fridrich Strba (fridrich.strba@bluewin.ch)
00020 * Copyright (C) 2006, 2007 Andrew Ziem
00021 * Copyright (C) 2011, 2012 Alonso Laurent (alonso@loria.fr)
00022 *
00023 *
00024 * All Rights Reserved.
00025 *
00026 * For minor contributions see the git repository.
00027 *
00028 * Alternatively, the contents of this file may be used under the terms of
00029 * the GNU Lesser General Public License Version 2 or later (the "LGPLv2+"),
00030 * in which case the provisions of the LGPLv2+ are applicable
00031 * instead of those above.
00032 */
00033 
00034 /*
00035  * Parser to convert some WriterPlus text document ( a french text editor )
00036  *
00037  */
00038 #ifndef WP_PARSER
00039 #  define WP_PARSER
00040 
00041 #include <list>
00042 #include <string>
00043 #include <vector>
00044 
00045 #include "MWAWDebug.hxx"
00046 #include "MWAWEntry.hxx"
00047 #include "MWAWInputStream.hxx"
00048 
00049 #include "MWAWParser.hxx"
00050 
00051 namespace WPParserInternal
00052 {
00053 struct State;
00054 struct Font;
00055 struct Line;
00056 struct ParagraphData;
00057 struct ParagraphInfo;
00058 class SubDocument;
00059 }
00060 
00066 class WPParser : public MWAWParser
00067 {
00068   friend class WPParserInternal::SubDocument;
00069 
00070 public:
00072   WPParser(MWAWInputStreamPtr input, MWAWRSRCParserPtr rsrcParser, MWAWHeader *header);
00074   virtual ~WPParser();
00075 
00077   bool checkHeader(MWAWHeader *header, bool strict=false);
00078 
00079   // the main parse function
00080   void parse(WPXDocumentInterface *documentInterface);
00081 
00082 protected:
00084   void init();
00085 
00087   void createDocument(WPXDocumentInterface *documentInterface);
00088 
00090   bool createZones();
00091 
00093   bool readPrintInfo();
00094 
00096   bool readWindowsInfo(int zone);
00097 
00099   bool sendWindow(int zone, Vec2i limits = Vec2i(-1,-1));
00100 
00102   bool readWindowsZone(int zone);
00103 
00105   bool readPageInfo(int zone);
00106 
00108   bool readColInfo(int zone);
00109 
00111   bool readParagraphInfo(int zone);
00112 
00114   bool findSection(int zone, Vec2i limits, MWAWSection &sec);
00115 
00117   bool readSection(WPParserInternal::ParagraphInfo const &info, bool mainBlock);
00118 
00120   bool readText(WPParserInternal::ParagraphInfo const &info);
00121 
00123   bool readTable(WPParserInternal::ParagraphInfo const &info);
00124 
00126   bool readGraphic(WPParserInternal::ParagraphInfo const &info);
00127 
00129   bool readUnknown(WPParserInternal::ParagraphInfo const &info);
00130 
00132   double getTextHeight() const;
00133 
00135   void newPage(int number);
00136 
00137   //
00138   // low level
00139   //
00140 
00142   bool readParagraphData(WPParserInternal::ParagraphInfo const &info, bool hasFonts,
00143                          WPParserInternal::ParagraphData &data);
00145   MWAWParagraph getParagraph(WPParserInternal::ParagraphData const &data);
00147   bool readFonts(int nFonts, int type,
00148                  std::vector<WPParserInternal::Font> &fonts);
00149 
00151   bool readLines(WPParserInternal::ParagraphInfo const &info,
00152                  int nLines, std::vector<WPParserInternal::Line> &lines);
00153 
00154 protected:
00155   //
00156   // data
00157   //
00158 
00160   shared_ptr<WPParserInternal::State> m_state;
00161 };
00162 #endif
00163 // vim: set filetype=cpp tabstop=2 shiftwidth=2 cindent autoindent smartindent noexpandtab: