Blame libdjvu/UnicodeByteStream.cpp

Packit df99a1
//C-  -*- C++ -*-
Packit df99a1
//C- -------------------------------------------------------------------
Packit df99a1
//C- DjVuLibre-3.5
Packit df99a1
//C- Copyright (c) 2002  Leon Bottou and Yann Le Cun.
Packit df99a1
//C- Copyright (c) 2001  AT&T
Packit df99a1
//C-
Packit df99a1
//C- This software is subject to, and may be distributed under, the
Packit df99a1
//C- GNU General Public License, either Version 2 of the license,
Packit df99a1
//C- or (at your option) any later version. The license should have
Packit df99a1
//C- accompanied the software or you may obtain a copy of the license
Packit df99a1
//C- from the Free Software Foundation at http://www.fsf.org .
Packit df99a1
//C-
Packit df99a1
//C- This program is distributed in the hope that it will be useful,
Packit df99a1
//C- but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit df99a1
//C- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
Packit df99a1
//C- GNU General Public License for more details.
Packit df99a1
//C- 
Packit df99a1
//C- DjVuLibre-3.5 is derived from the DjVu(r) Reference Library from
Packit df99a1
//C- Lizardtech Software.  Lizardtech Software has authorized us to
Packit df99a1
//C- replace the original DjVu(r) Reference Library notice by the following
Packit df99a1
//C- text (see doc/lizard2002.djvu and doc/lizardtech2007.djvu):
Packit df99a1
//C-
Packit df99a1
//C-  ------------------------------------------------------------------
Packit df99a1
//C- | DjVu (r) Reference Library (v. 3.5)
Packit df99a1
//C- | Copyright (c) 1999-2001 LizardTech, Inc. All Rights Reserved.
Packit df99a1
//C- | The DjVu Reference Library is protected by U.S. Pat. No.
Packit df99a1
//C- | 6,058,214 and patents pending.
Packit df99a1
//C- |
Packit df99a1
//C- | This software is subject to, and may be distributed under, the
Packit df99a1
//C- | GNU General Public License, either Version 2 of the license,
Packit df99a1
//C- | or (at your option) any later version. The license should have
Packit df99a1
//C- | accompanied the software or you may obtain a copy of the license
Packit df99a1
//C- | from the Free Software Foundation at http://www.fsf.org .
Packit df99a1
//C- |
Packit df99a1
//C- | The computer code originally released by LizardTech under this
Packit df99a1
//C- | license and unmodified by other parties is deemed "the LIZARDTECH
Packit df99a1
//C- | ORIGINAL CODE."  Subject to any third party intellectual property
Packit df99a1
//C- | claims, LizardTech grants recipient a worldwide, royalty-free, 
Packit df99a1
//C- | non-exclusive license to make, use, sell, or otherwise dispose of 
Packit df99a1
//C- | the LIZARDTECH ORIGINAL CODE or of programs derived from the 
Packit df99a1
//C- | LIZARDTECH ORIGINAL CODE in compliance with the terms of the GNU 
Packit df99a1
//C- | General Public License.   This grant only confers the right to 
Packit df99a1
//C- | infringe patent claims underlying the LIZARDTECH ORIGINAL CODE to 
Packit df99a1
//C- | the extent such infringement is reasonably necessary to enable 
Packit df99a1
//C- | recipient to make, have made, practice, sell, or otherwise dispose 
Packit df99a1
//C- | of the LIZARDTECH ORIGINAL CODE (or portions thereof) and not to 
Packit df99a1
//C- | any greater extent that may be necessary to utilize further 
Packit df99a1
//C- | modifications or combinations.
Packit df99a1
//C- |
Packit df99a1
//C- | The LIZARDTECH ORIGINAL CODE is provided "AS IS" WITHOUT WARRANTY
Packit df99a1
//C- | OF ANY KIND, EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
Packit df99a1
//C- | TO ANY WARRANTY OF NON-INFRINGEMENT, OR ANY IMPLIED WARRANTY OF
Packit df99a1
//C- | MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
Packit df99a1
//C- +------------------------------------------------------------------
Packit df99a1
Packit df99a1
#ifdef HAVE_CONFIG_H
Packit df99a1
# include "config.h"
Packit df99a1
#endif
Packit df99a1
#if NEED_GNUG_PRAGMAS
Packit df99a1
# pragma implementation
Packit df99a1
#endif
Packit df99a1
Packit df99a1
#include "UnicodeByteStream.h"
Packit df99a1
#include "ByteStream.h"
Packit df99a1
Packit df99a1
Packit df99a1
#ifdef HAVE_NAMESPACES
Packit df99a1
namespace DJVU {
Packit df99a1
# ifdef NOT_DEFINED // Just to fool emacs c++ mode
Packit df99a1
}
Packit df99a1
#endif
Packit df99a1
#endif
Packit df99a1
Packit df99a1
// Copy constructor.  The new object shares the underlying stream with
// uni and takes over its decode buffer and read offset; the line counter
// starts again from zero and startpos is taken from the stream's current
// position.
UnicodeByteStream::UnicodeByteStream(const UnicodeByteStream &uni)
  : bs(uni.bs),
    buffer(uni.buffer),
    bufferpos(uni.bufferpos),
    linesread(0)
{
  startpos=bs->tell();
}
Packit df99a1
Packit df99a1
// Wrap the stream ibs, starting with an empty decode buffer created for
// the encoding type et.  startpos records the stream position at the
// time of construction.
UnicodeByteStream::UnicodeByteStream(
  GP<ByteStream> ibs,const GStringRep::EncodeType et)
  : bs(ibs),
    bufferpos(0),
    linesread(0)
{
  startpos=bs->tell();
  buffer=GUTF8String::create(0,0,et);
}
Packit df99a1
Packit df99a1
// Nothing to release explicitly here.
UnicodeByteStream::~UnicodeByteStream()
{
}
Packit df99a1
Packit df99a1
static int
Packit df99a1
CountLines(const GUTF8String &str)
Packit df99a1
{
Packit df99a1
  int retval=0;
Packit df99a1
  static const unsigned long lf='\n';
Packit df99a1
  for(int pos=0;(pos=str.search(lf,pos)+1)>0;++retval)
Packit df99a1
    EMPTY_LOOP;
Packit df99a1
  return retval;
Packit df99a1
}
Packit df99a1
Packit df99a1
void
Packit df99a1
UnicodeByteStream::set_encodetype(const GStringRep::EncodeType et)
Packit df99a1
{
Packit df99a1
  seek(startpos,SEEK_SET);
Packit df99a1
  bufferpos=0;
Packit df99a1
  buffer=GUTF8String::create(0,0,et);
Packit df99a1
}
Packit df99a1
Packit df99a1
void
Packit df99a1
UnicodeByteStream::set_encoding(const GUTF8String &xencoding)
Packit df99a1
{
Packit df99a1
  seek(startpos,SEEK_SET);
Packit df99a1
  bufferpos=0;
Packit df99a1
  buffer=GUTF8String::create(0,0,xencoding);
Packit df99a1
}
Packit df99a1
Packit df99a1
// Read up to size raw bytes from the underlying stream into buf and
// rebuild the decode buffer from them.  The new buffer is created with
// whatever buffer.get_remainder() returns for the previous one
// (presumably undecoded trailing bytes / encoding state -- confirm in
// GString).  Returns the value returned by the underlying read.
size_t
UnicodeByteStream::read(void *buf, size_t size)
{
  bufferpos=0;
  const int nread=bs->read(buf,size);
  if(!nread)
  {
    // Nothing was read: keep only the carried-over remainder.
    buffer=GUTF8String::create(0,0,buffer.get_remainder());
    return nread;
  }
  buffer=GUTF8String::create(
    (unsigned char const *)buf,nread,buffer.get_remainder());
  return nread;
}
Packit df99a1
Packit df99a1
// Forward a raw write to the underlying stream.  Text decoded so far is
// dropped first: the buffer is recreated empty from its own remainder
// and the read offset is reset.
size_t
UnicodeByteStream::write(const void *buf, size_t size)
{
  buffer=GUTF8String::create(0,0,buffer.get_remainder());
  bufferpos=0;
  return bs->write(buf,size);
}
Packit df99a1
Packit df99a1
long 
Packit df99a1
UnicodeByteStream::tell(void) const
Packit df99a1
{
Packit df99a1
  return bs->tell();
Packit df99a1
}
Packit df99a1
Packit df99a1
// Assignment: share uni's underlying stream and take over its decode
// buffer and read offset.
//
// startpos is re-derived from the newly attached stream, exactly as the
// copy constructor does.  Leaving the old value in place would make a
// later set_encodetype()/set_encoding() rewind the new stream to an
// offset that belonged to the previously attached one.
// linesread is left untouched, as before.
UnicodeByteStream & 
UnicodeByteStream::operator=(UnicodeByteStream &uni)
{
  // Self-assignment must stay a no-op (in particular it must not move
  // startpos to the current stream position).
  if(this!=&uni)
  {
    bs=uni.bs;
    bufferpos=uni.bufferpos;
    buffer=uni.buffer;
    startpos=bs->tell();
  }
  return *this;
}
Packit df99a1
Packit df99a1
int 
Packit df99a1
UnicodeByteStream::seek
Packit df99a1
(long offset, int whence, bool nothrow)
Packit df99a1
{
Packit df99a1
  int retval=bs->seek(offset,whence,nothrow);
Packit df99a1
  bufferpos=0;
Packit df99a1
  buffer=GUTF8String::create(0,0,buffer.get_remainder());
Packit df99a1
  return retval;
Packit df99a1
}
Packit df99a1
Packit df99a1
void 
Packit df99a1
UnicodeByteStream::flush(void)
Packit df99a1
{
Packit df99a1
  bs->flush();
Packit df99a1
  bufferpos=0;
Packit df99a1
  buffer=GUTF8String::create(0,0,buffer.get_remainder());
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
// Return decoded text starting at the current read offset.
//
//   t         - maximum length of the returned text, measured in the
//               same units as offsets into the decode buffer; 0 means
//               "no limit".
//   stopat    - character at which to stop (it is narrowed to char
//               before searching the buffer).
//   inclusive - when true, the stop character is part of the result and
//               is consumed; when false, the read offset is left on it.
//
// When the decode buffer is exhausted, it is refilled from the stream.
// If the stop character is not in the buffered text, the buffered text
// is consumed and the search continues in the following data.  An empty
// string is returned once no more data can be obtained.  linesread is
// advanced by the number of line feeds in the text returned.
GUTF8String
UnicodeByteStream::gets(
  size_t const t,unsigned long const stopat,bool const inclusive)
{
  GUTF8String retval;
  unsigned int len=buffer.length()-bufferpos;
  if(!len)
  {
    // Buffer exhausted: keep reading raw chunks until at least some
    // decoded text is available or the stream reports no more data.
    char *buf;
    static const size_t bufsize=327680;
    GPBuffer<char> gbuf(buf,bufsize);
    while(read(buf,bufsize)>0)
    {
      if((len=buffer.length()-bufferpos))
        break;
    }
  }
  if(len)
  {
    int i=buffer.search((char)stopat,bufferpos);
    if(i>=0)
    {
      if(inclusive)
      {
        ++i;
      }
      // Never hand out more than t units, even if the stop character
      // lies further away.
      if(t&&(i>(int)t+bufferpos))
      {
        i=t+bufferpos;
      }
      if(i>bufferpos)
      {
        retval=buffer.substr(bufferpos,i-bufferpos);
      }
      bufferpos=i;
      linesread+=CountLines(retval);
    }else if(t&&(len>=t))
    {
      // No stop character, but the limit is reached inside the buffered
      // text: return exactly t units and stop.  (Recursing with a
      // remaining count of 0 would wrongly mean "no limit".)
      retval=buffer.substr(bufferpos,(int)t);
      bufferpos+=(int)t;
      linesread+=CountLines(retval);
    }else
    {
      // No stop character in the buffered text: take all of it and carry
      // on with whatever is left of the limit.
      retval=buffer.substr(bufferpos,len);
      bufferpos=buffer.length();
      linesread+=CountLines(retval);
      retval+=gets(t?(t-len):0,stopat,inclusive);
    }
  }
  return retval;
}
Packit df99a1
Packit df99a1
// Build an XML stream as a copy of an existing UnicodeByteStream.
XMLByteStream::XMLByteStream(UnicodeByteStream &uni)
  : UnicodeByteStream(uni)
{
}
Packit df99a1
Packit df99a1
// Wrap the stream ibs.  The base class is set up with the XOTHER
// encoding type; init() replaces the buffer once the leading bytes of
// the stream have been examined.
XMLByteStream::XMLByteStream(GP<ByteStream> &ibs) 
  : UnicodeByteStream(ibs,GStringRep::XOTHER)
{
}
Packit df99a1
Packit df99a1
// Factory: allocate an XMLByteStream on ibs, place it under smart
// pointer ownership, and only then run init() to detect the encoding.
GP<XMLByteStream>
XMLByteStream::create(GP<ByteStream> ibs) 
{
  GP<XMLByteStream> stream(new XMLByteStream(ibs));
  stream->init();
  return stream;
}
Packit df99a1
Packit df99a1
void
Packit df99a1
XMLByteStream::init(void)
Packit df99a1
{
Packit df99a1
  unsigned char buf[4];
Packit df99a1
  GP<ByteStream> ibs=bs;
Packit df99a1
  bufferpos=0;
Packit df99a1
  bs->readall(buf,sizeof(buf));
Packit df99a1
  const unsigned int i=(buf[0]<<8)+buf[1];
Packit df99a1
  switch(i)
Packit df99a1
  {
Packit df99a1
    case 0x0000:
Packit df99a1
    {
Packit df99a1
      const unsigned int j=(buf[2]<<8)+buf[3];
Packit df99a1
      switch(j)
Packit df99a1
      {
Packit df99a1
        case 0x003C:
Packit df99a1
        {
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUCS4BE);
Packit df99a1
          break;
Packit df99a1
        }
Packit df99a1
        case 0x3C00:
Packit df99a1
        {
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUCS4_2143);
Packit df99a1
          break;
Packit df99a1
        }
Packit df99a1
        case 0xFEFF:
Packit df99a1
        {
Packit df99a1
          buffer=GUTF8String::create(0,0,GStringRep::XUCS4BE);
Packit df99a1
          startpos+=sizeof(buf);
Packit df99a1
          break;
Packit df99a1
        }
Packit df99a1
        case 0xFFFE:
Packit df99a1
        {
Packit df99a1
          buffer=GUTF8String::create(0,0,GStringRep::XUCS4_2143);
Packit df99a1
          startpos+=sizeof(buf);
Packit df99a1
          break;
Packit df99a1
        }
Packit df99a1
        default:
Packit df99a1
        {
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF8);
Packit df99a1
          break;
Packit df99a1
        }
Packit df99a1
      }
Packit df99a1
    }
Packit df99a1
    case 0x003C:
Packit df99a1
    {
Packit df99a1
      const unsigned int j=(buf[2]<<8)+buf[3];
Packit df99a1
      switch(j)
Packit df99a1
      {
Packit df99a1
        case 0x0000:
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUCS4_3412);
Packit df99a1
          break;
Packit df99a1
        case 0x003F:
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF16BE);
Packit df99a1
          break;
Packit df99a1
        default:
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF8);
Packit df99a1
          break;
Packit df99a1
      }
Packit df99a1
      break;
Packit df99a1
    }
Packit df99a1
    case 0x3C00:
Packit df99a1
    {
Packit df99a1
      const unsigned int j=(buf[2]<<8)+buf[3];
Packit df99a1
      switch(j)
Packit df99a1
      {
Packit df99a1
        case 0x0000:
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUCS4LE);
Packit df99a1
          break;
Packit df99a1
        case 0x3F00:
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF16LE);
Packit df99a1
          break;
Packit df99a1
        default:
Packit df99a1
          buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF8);
Packit df99a1
          break;
Packit df99a1
      }
Packit df99a1
      break;
Packit df99a1
    }
Packit df99a1
    case 0x4C6F:
Packit df99a1
    {
Packit df99a1
      const unsigned int j=(buf[2]<<8)+buf[3];
Packit df99a1
      buffer=GUTF8String::create(buf,sizeof(buf),
Packit df99a1
         (j == 0xA794)?(GStringRep::XEBCDIC):(GStringRep::XUTF8));
Packit df99a1
      break;
Packit df99a1
    }
Packit df99a1
    case 0xFFFE:
Packit df99a1
    {
Packit df99a1
      buffer=GUTF8String::create(buf+2,sizeof(buf)-2,GStringRep::XUTF16LE);
Packit df99a1
      startpos+=2;
Packit df99a1
      break;
Packit df99a1
    }
Packit df99a1
    case 0xFEFF:
Packit df99a1
    {
Packit df99a1
      buffer=GUTF8String::create(buf+2,sizeof(buf)-2,GStringRep::XUTF16BE);
Packit df99a1
      startpos+=2;
Packit df99a1
      break;
Packit df99a1
    }
Packit df99a1
    case 0xEFBB:
Packit df99a1
    {
Packit df99a1
      if(buf[2] == 0xBF)
Packit df99a1
      {
Packit df99a1
        buffer=GUTF8String::create(buf+3,sizeof(buf)-3,GStringRep::XUTF8);
Packit df99a1
        startpos+=3;
Packit df99a1
      }else
Packit df99a1
      {
Packit df99a1
        buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF8);
Packit df99a1
      }
Packit df99a1
      break;
Packit df99a1
    }
Packit df99a1
    case 0x3C3F:
Packit df99a1
    default:
Packit df99a1
    {
Packit df99a1
      buffer=GUTF8String::create(buf,sizeof(buf),GStringRep::XUTF8);
Packit df99a1
    }
Packit df99a1
  }
Packit df99a1
  bs=ibs;
Packit df99a1
}
Packit df99a1
Packit df99a1
// Nothing to release explicitly here.
XMLByteStream::~XMLByteStream()
{
}
Packit df99a1
Packit df99a1
Packit df99a1
#ifdef HAVE_NAMESPACES
Packit df99a1
}
Packit df99a1
# ifndef NOT_USING_DJVU_NAMESPACE
Packit df99a1
using namespace DJVU;
Packit df99a1
# endif
Packit df99a1
#endif