/* -*- Mode: C++; tab-width: 4; indent-tabs-mode: t; c-basic-offset: 4 -*- */
/* libwpd
* Version: MPL 2.0 / LGPLv2.1+
*
* This Source Code Form is subject to the terms of the Mozilla Public
* License, v. 2.0. If a copy of the MPL was not distributed with this
* file, You can obtain one at http://mozilla.org/MPL/2.0/.
*
* Major Contributor(s):
* Copyright (C) 2003 William Lachance (wrlach@gmail.com)
* Copyright (C) 2003 Marc Maurer (uwog@uwog.net)
* Copyright (C) 2006 Fridrich Strba (fridrich.strba@bluewin.ch)
*
* For minor contributions see the git repository.
*
* Alternatively, the contents of this file may be used under the terms
* of the GNU Lesser General Public License Version 2.1 or later
* (LGPLv2.1+), in which case the provisions of the LGPLv2.1+ are
* applicable instead of those above.
*
* For further information visit http://libwpd.sourceforge.net
*/
/* "This product is not manufactured, approved, or supported by
* Corel Corporation or Corel Corporation Limited."
*/
#include "WP42Parser.h"
#include <memory>
#include "WP42Part.h"
#include "WPXHeader.h"
#include "libwpd_internal.h"
#include "WPXTable.h"
#include "WP42FileStructure.h"
#include "WP42StylesListener.h"
#include "WP42ContentListener.h"
WP42Parser::WP42Parser(librevenge::RVNGInputStream *input, WPXEncryption *encryption) :
WPXParser(input, nullptr, encryption)
{
}
WP42Parser::~WP42Parser()
{
}
void WP42Parser::parse(librevenge::RVNGInputStream *input, WPXEncryption *encryption, WP42Listener *listener)
{
listener->startDocument();
input->seek(0, librevenge::RVNG_SEEK_SET);
WPD_DEBUG_MSG(("WordPerfect: Starting document body parse (position = %ld)\n",(long)input->tell()));
parseDocument(input, encryption, listener);
listener->endDocument();
}
// parseDocument: parses a document body (may call itself recursively, on other streams, or itself)
void WP42Parser::parseDocument(librevenge::RVNGInputStream *input, WPXEncryption *encryption, WP42Listener *listener)
{
while (!input->isEnd())
{
unsigned char readVal;
readVal = readU8(input, encryption);
if (readVal < (unsigned char)0x20)
{
WPD_DEBUG_MSG(("Offset: %i, Handling Control Character 0x%2x\n", (unsigned int)input->tell(), readVal));
switch (readVal)
{
case 0x09: // tab
listener->insertTab(0, 0.0);
break;
case 0x0A: // hard new line
listener->insertEOL();
break;
case 0x0B: // soft new page
listener->insertBreak(WPX_SOFT_PAGE_BREAK);
break;
case 0x0C: // hard new page
listener->insertBreak(WPX_PAGE_BREAK);
break;
case 0x0D: // soft new line
listener->insertCharacter(' ');
break;
default:
// unsupported or undocumented token, ignore
break;
}
}
else if (readVal >= (unsigned char)0x20 && readVal <= (unsigned char)0x7F)
{
WPD_DEBUG_MSG(("Offset: %i, Handling Ascii Character 0x%2x\n", (unsigned int)input->tell(), readVal));
// normal ASCII characters
listener->insertCharacter(readVal);
}
else if (readVal >= (unsigned char)0x80 && readVal <= (unsigned char)0xBF)
{
WPD_DEBUG_MSG(("Offset: %i, Handling Single Character Function 0x%2x\n", (unsigned int)input->tell(), readVal));
// single character function codes
switch (readVal)
{
case 0x92:
listener->attributeChange(true, WP42_ATTRIBUTE_STRIKE_OUT);
break;
case 0x93:
listener->attributeChange(false, WP42_ATTRIBUTE_STRIKE_OUT);
break;
case 0x94:
listener->attributeChange(true, WP42_ATTRIBUTE_UNDERLINE);
break;
case 0x95:
listener->attributeChange(false, WP42_ATTRIBUTE_UNDERLINE);
break;
case 0x90:
listener->attributeChange(true, WP42_ATTRIBUTE_REDLINE);
break;
case 0x91:
listener->attributeChange(false, WP42_ATTRIBUTE_REDLINE);
break;
case 0x9C:
listener->attributeChange(false, WP42_ATTRIBUTE_BOLD);
break;
case 0x9D:
listener->attributeChange(true, WP42_ATTRIBUTE_BOLD);
break;
case 0xB2:
listener->attributeChange(true, WP42_ATTRIBUTE_ITALICS);
break;
case 0xB3:
listener->attributeChange(false, WP42_ATTRIBUTE_ITALICS);
break;
case 0xB4:
listener->attributeChange(true, WP42_ATTRIBUTE_SHADOW);
break;
case 0xB5:
listener->attributeChange(false, WP42_ATTRIBUTE_SHADOW);
break;
default:
// unsupported or undocumented token, ignore
break;
}
}
else if (readVal >= (unsigned char)0xC0 && readVal <= (unsigned char)0xFE)
{
std::unique_ptr<WP42Part> part(WP42Part::constructPart(input, encryption, readVal));
if (part)
part->parse(listener);
}
// ignore the rest since they are not documented and at least 0xFF is a special character that
// marks end of variable length part in variable length multi-byte functions
}
}
void WP42Parser::parse(librevenge::RVNGTextInterface *documentInterface)
{
librevenge::RVNGInputStream *input = getInput();
WPXEncryption *encryption = getEncryption();
std::list<WPXPageSpan> pageList;
std::vector<WP42SubDocument *> subDocuments;
try
{
// do a "first-pass" parse of the document
// gather table border information, page properties (per-page)
WP42StylesListener stylesListener(pageList, subDocuments);
parse(input, encryption, &stylesListener);
// postprocess the pageList == remove duplicate page spans due to the page breaks
std::list<WPXPageSpan>::iterator previousPage = pageList.begin();
for (std::list<WPXPageSpan>::iterator Iter=pageList.begin(); Iter != pageList.end();)
{
if ((Iter != previousPage) && ((*previousPage)==(*Iter)))
{
(*previousPage).setPageSpan((*previousPage).getPageSpan() + (*Iter).getPageSpan());
Iter = pageList.erase(Iter);
}
else
{
previousPage = Iter;
++Iter;
}
}
// second pass: here is where we actually send the messages to the target app
// that are necessary to emit the body of the target document
WP42ContentListener listener(pageList, subDocuments, documentInterface);
parse(input, encryption, &listener);
// cleanup section: free the used resources
for (auto &subDocument : subDocuments)
{
if (subDocument)
delete subDocument;
}
}
catch (FileException)
{
WPD_DEBUG_MSG(("WordPerfect: File Exception. Parse terminated prematurely."));
for (auto &subDocument : subDocuments)
{
if (subDocument)
delete subDocument;
}
throw FileException();
}
}
void WP42Parser::parseSubDocument(librevenge::RVNGTextInterface *documentInterface)
{
std::list<WPXPageSpan> pageList;
std::vector<WP42SubDocument *> subDocuments;
librevenge::RVNGInputStream *input = getInput();
try
{
WP42StylesListener stylesListener(pageList, subDocuments);
stylesListener.startSubDocument();
parseDocument(input, nullptr, &stylesListener);
stylesListener.endSubDocument();
WP42ContentListener listener(pageList, subDocuments, documentInterface);
listener.startSubDocument();
parseDocument(input, nullptr, &listener);
listener.endSubDocument();
for (auto &subDocument : subDocuments)
if (subDocument)
delete subDocument;
}
catch (FileException)
{
WPD_DEBUG_MSG(("WordPerfect: File Exception. Parse terminated prematurely."));
for (auto &subDocument : subDocuments)
if (subDocument)
delete subDocument;
throw FileException();
}
}
/* vim:set shiftwidth=4 softtabstop=4 noexpandtab: */