Blame libdjvu/BSEncodeByteStream.cpp

Packit df99a1
//C-  -*- C++ -*-
Packit df99a1
//C- -------------------------------------------------------------------
Packit df99a1
//C- DjVuLibre-3.5
Packit df99a1
//C- Copyright (c) 2002  Leon Bottou and Yann Le Cun.
Packit df99a1
//C- Copyright (c) 2001  AT&T
Packit df99a1
//C-
Packit df99a1
//C- This software is subject to, and may be distributed under, the
Packit df99a1
//C- GNU General Public License, either Version 2 of the license,
Packit df99a1
//C- or (at your option) any later version. The license should have
Packit df99a1
//C- accompanied the software or you may obtain a copy of the license
Packit df99a1
//C- from the Free Software Foundation at http://www.fsf.org .
Packit df99a1
//C-
Packit df99a1
//C- This program is distributed in the hope that it will be useful,
Packit df99a1
//C- but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit df99a1
//C- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
Packit df99a1
//C- GNU General Public License for more details.
Packit df99a1
//C- 
Packit df99a1
//C- DjVuLibre-3.5 is derived from the DjVu(r) Reference Library from
Packit df99a1
//C- Lizardtech Software.  Lizardtech Software has authorized us to
Packit df99a1
//C- replace the original DjVu(r) Reference Library notice by the following
Packit df99a1
//C- text (see doc/lizard2002.djvu and doc/lizardtech2007.djvu):
Packit df99a1
//C-
Packit df99a1
//C-  ------------------------------------------------------------------
Packit df99a1
//C- | DjVu (r) Reference Library (v. 3.5)
Packit df99a1
//C- | Copyright (c) 1999-2001 LizardTech, Inc. All Rights Reserved.
Packit df99a1
//C- | The DjVu Reference Library is protected by U.S. Pat. No.
Packit df99a1
//C- | 6,058,214 and patents pending.
Packit df99a1
//C- |
Packit df99a1
//C- | This software is subject to, and may be distributed under, the
Packit df99a1
//C- | GNU General Public License, either Version 2 of the license,
Packit df99a1
//C- | or (at your option) any later version. The license should have
Packit df99a1
//C- | accompanied the software or you may obtain a copy of the license
Packit df99a1
//C- | from the Free Software Foundation at http://www.fsf.org .
Packit df99a1
//C- |
Packit df99a1
//C- | The computer code originally released by LizardTech under this
Packit df99a1
//C- | license and unmodified by other parties is deemed "the LIZARDTECH
Packit df99a1
//C- | ORIGINAL CODE."  Subject to any third party intellectual property
Packit df99a1
//C- | claims, LizardTech grants recipient a worldwide, royalty-free, 
Packit df99a1
//C- | non-exclusive license to make, use, sell, or otherwise dispose of 
Packit df99a1
//C- | the LIZARDTECH ORIGINAL CODE or of programs derived from the 
Packit df99a1
//C- | LIZARDTECH ORIGINAL CODE in compliance with the terms of the GNU 
Packit df99a1
//C- | General Public License.   This grant only confers the right to 
Packit df99a1
//C- | infringe patent claims underlying the LIZARDTECH ORIGINAL CODE to 
Packit df99a1
//C- | the extent such infringement is reasonably necessary to enable 
Packit df99a1
//C- | recipient to make, have made, practice, sell, or otherwise dispose 
Packit df99a1
//C- | of the LIZARDTECH ORIGINAL CODE (or portions thereof) and not to 
Packit df99a1
//C- | any greater extent that may be necessary to utilize further 
Packit df99a1
//C- | modifications or combinations.
Packit df99a1
//C- |
Packit df99a1
//C- | The LIZARDTECH ORIGINAL CODE is provided "AS IS" WITHOUT WARRANTY
Packit df99a1
//C- | OF ANY KIND, EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
Packit df99a1
//C- | TO ANY WARRANTY OF NON-INFRINGEMENT, OR ANY IMPLIED WARRANTY OF
Packit df99a1
//C- | MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
Packit df99a1
//C- +------------------------------------------------------------------
Packit df99a1
Packit df99a1
#ifdef HAVE_CONFIG_H
Packit df99a1
# include "config.h"
Packit df99a1
#endif
Packit df99a1
#if NEED_GNUG_PRAGMAS
Packit df99a1
# pragma implementation
Packit df99a1
#endif
Packit df99a1
Packit df99a1
// - Author: Leon Bottou, 07/1998
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
#include "BSByteStream.h"
Packit df99a1
#include "GString.h"
Packit df99a1
#undef BSORT_TIMER
Packit df99a1
#ifdef BSORT_TIMER
Packit df99a1
#include "GOS.h"
Packit df99a1
#endif
Packit df99a1
Packit df99a1
#include <stddef.h>
Packit df99a1
#include <stdlib.h>
Packit df99a1
#include <stdio.h>
Packit df99a1
#include <string.h>
Packit df99a1
Packit df99a1
Packit df99a1
#ifdef HAVE_NAMESPACES
Packit df99a1
namespace DJVU {
Packit df99a1
# ifdef NOT_DEFINED // Just to fool emacs c++ mode
Packit df99a1
}
Packit df99a1
#endif
Packit df99a1
#endif
Packit df99a1
Packit df99a1
Packit df99a1
// ========================================
Packit df99a1
// --- Assertion
Packit df99a1
Packit df99a1
// ASSERT(expr) -- runtime check used throughout this file.
// When `expr` evaluates to false, invokes G_THROW with a message that
// embeds the stringized expression.  The do{...}while(0) wrapper makes the
// macro usable as a single statement (e.g. inside an unbraced if/else).
#define ASSERT(expr) do{if(!(expr))G_THROW("assertion ("#expr") failed");}while(0)
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
// ========================================
Packit df99a1
// --- Global Definitions
Packit df99a1
            
Packit df99a1
Packit df99a1
// Some system headers define an OVERFLOW macro; drop it so the name can be
// used for the constant below.
#ifdef OVERFLOW
#undef OVERFLOW
#endif
// Overflow required when encoding
static const int OVERFLOW=32;

// Sorting thresholds
// -- ranges shorter than this are finished with the insertion sort (ranksort)
static const int RANKSORT_THRESH=10;
// -- capacity of the explicit stacks used by quicksort3r / quicksort3d
static const int QUICKSORT_STACK=512;
// -- ranges shorter than this are insertion-sorted during the presort
static const int PRESORT_THRESH=10;
// -- number of leading bytes compared by the presort (see GTD, quicksort3d)
static const int PRESORT_DEPTH=8;
// -- blocks larger than this start with the 16 bit radix sort, others with
//    the 8 bit radix sort (see _BSort::run)
static const int RADIX_THRESH=32768;

// Block size limits used by the encoder to select the estimation speed
// (fshift is 0 below FREQS0, 1 below FREQS1, 2 otherwise).
static const int FREQS0=100000;
static const int FREQS1=1000000;
Packit df99a1
Packit df99a1
// ========================================
Packit df99a1
// -- Sorting Routines
Packit df99a1
Packit df99a1
  
Packit df99a1
class _BSort  // DJVU_CLASS
Packit df99a1
{
Packit df99a1
public:
Packit df99a1
  ~_BSort();
Packit df99a1
  _BSort(unsigned char *data, int size);
Packit df99a1
  void run(int &markerpos);
Packit df99a1
private:
Packit df99a1
  // Members
Packit df99a1
  int            size;
Packit df99a1
  unsigned char *data;
Packit df99a1
  unsigned int  *posn;
Packit df99a1
  GPBuffer<unsigned int> gposn;
Packit df99a1
  int           *rank;
Packit df99a1
  GPBuffer<int> grank;
Packit df99a1
  // Helpers
Packit df99a1
  inline int GT(int p1, int p2, int depth);
Packit df99a1
  inline int GTD(int p1, int p2, int depth);
Packit df99a1
  // -- final in-depth sort
Packit df99a1
  void ranksort(int lo, int hi, int d);
Packit df99a1
  // -- doubling sort
Packit df99a1
  int  pivot3r(int *rr, int lo, int hi);
Packit df99a1
  void quicksort3r(int lo, int hi, int d);
Packit df99a1
  // -- presort to depth PRESORT_DEPTH
Packit df99a1
  unsigned char pivot3d(unsigned char *dd, int lo, int hi);
Packit df99a1
  void quicksort3d(int lo, int hi, int d);
Packit df99a1
  // -- radixsort
Packit df99a1
  void radixsort16(void);
Packit df99a1
  void radixsort8(void);
Packit df99a1
};
Packit df99a1
Packit df99a1
Packit df99a1
// blocksort -- the main entry point
Packit df99a1
Packit df99a1
static void 
Packit df99a1
blocksort(unsigned char *data, int size, int &markerpos)
Packit df99a1
{
Packit df99a1
  _BSort bsort(data, size);
Packit df99a1
  bsort.run(markerpos);
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort construction
Packit df99a1
Packit df99a1
_BSort::_BSort(unsigned char *xdata, int xsize)
Packit df99a1
  : size(xsize), data(xdata), gposn(posn,xsize), grank(rank,xsize+1)
Packit df99a1
{
Packit df99a1
  ASSERT(size>0 && size<0x1000000);
Packit df99a1
  rank[size] = -1;
Packit df99a1
}
Packit df99a1
Packit df99a1
// Destructor: intentionally empty.  The posn/rank storage is presumably
// released by the gposn/grank GPBuffer members -- confirm against GPBuffer.
_BSort::~_BSort()
{
}
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
// GT -- compare suffixes using rank information
Packit df99a1
Packit df99a1
inline int 
Packit df99a1
_BSort::GT(int p1, int p2, int depth)
Packit df99a1
{
Packit df99a1
  int r1, r2;
Packit df99a1
  int twod = depth + depth;
Packit df99a1
  while (1)
Packit df99a1
    {
Packit df99a1
      r1=rank[p1+depth]; r2=rank[p2+depth];
Packit df99a1
      p1+=twod;  p2+=twod;
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1]; r2=rank[p2];
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1+depth]; r2=rank[p2+depth];
Packit df99a1
      p1+=twod;  p2+=twod;
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1]; r2=rank[p2];
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1+depth]; r2=rank[p2+depth];
Packit df99a1
      p1+=twod;  p2+=twod;
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1]; r2=rank[p2];
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1+depth]; r2=rank[p2+depth];
Packit df99a1
      p1+=twod;  p2+=twod;
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
      r1=rank[p1]; r2=rank[p2];
Packit df99a1
      if (r1!=r2) 
Packit df99a1
        return (r1>r2);
Packit df99a1
    };
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort::ranksort -- 
Packit df99a1
// -- a simple insertion sort based on GT
Packit df99a1
Packit df99a1
void 
Packit df99a1
_BSort::ranksort(int lo, int hi, int depth)
Packit df99a1
{
Packit df99a1
  int i,j;
Packit df99a1
  for (i=lo+1; i<=hi; i++)
Packit df99a1
    {
Packit df99a1
      int tmp = posn[i];
Packit df99a1
      for(j=i-1; j>=lo && GT(posn[j], tmp, depth); j--)
Packit df99a1
        posn[j+1] = posn[j];
Packit df99a1
      posn[j+1] = tmp;
Packit df99a1
    }
Packit df99a1
  for(i=lo;i<=hi;i++) 
Packit df99a1
    rank[posn[i]]=i;
Packit df99a1
}
Packit df99a1
Packit df99a1
// pivot -- return suitable pivot
Packit df99a1
Packit df99a1
inline int
Packit df99a1
_BSort::pivot3r(int *rr, int lo, int hi)
Packit df99a1
{
Packit df99a1
  int c1, c2, c3;
Packit df99a1
  if (hi-lo > 256)
Packit df99a1
    {
Packit df99a1
      c1 = pivot3r(rr, lo, (6*lo+2*hi)/8);
Packit df99a1
      c2 = pivot3r(rr, (5*lo+3*hi)/8, (3*lo+5*hi)/8);
Packit df99a1
      c3 = pivot3r(rr, (2*lo+6*hi)/8, hi);
Packit df99a1
    }
Packit df99a1
  else
Packit df99a1
    {
Packit df99a1
      c1 = rr[posn[lo]];
Packit df99a1
      c2 = rr[posn[(lo+hi)/2]];
Packit df99a1
      c3 = rr[posn[hi]];
Packit df99a1
    }
Packit df99a1
  // Extract median
Packit df99a1
  if (c1>c3)
Packit df99a1
    { int tmp=c1; c1=c3; c3=tmp; }
Packit df99a1
  if (c2<=c1)
Packit df99a1
    return c1;
Packit df99a1
  else if (c2>=c3)
Packit df99a1
    return c3;
Packit df99a1
  else
Packit df99a1
    return c2;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort::quicksort3r -- Three way quicksort algorithm 
Packit df99a1
//    Sort suffixes based on rank at pos+depth
Packit df99a1
//    The algorithm breaks into ranksort when size is 
Packit df99a1
//    smaller than RANKSORT_THRESH
Packit df99a1
Packit df99a1
// mini -- returns the smaller of two ints (a when they are equal)
static inline int
mini(int a, int b) 
{
  return (a<=b) ? a : b;
}
Packit df99a1
Packit df99a1
// vswap -- exchanges the n elements x[i..i+n-1] with x[j..j+n-1]
//   Does nothing when n <= 0.  The elements are swapped pairwise in
//   increasing index order.
static inline void
vswap(int i, int j, int n, unsigned int *x)
{
  while (n-- > 0) 
    {
      // Same type as the elements: no round trip through a signed int
      unsigned int tmp = x[i];
      x[i++] = x[j];
      x[j++] = tmp;
    }
}
Packit df99a1
Packit df99a1
void 
Packit df99a1
_BSort::quicksort3r(int lo, int hi, int depth)
Packit df99a1
{
Packit df99a1
  /* Initialize stack */
Packit df99a1
  int slo[QUICKSORT_STACK];
Packit df99a1
  int shi[QUICKSORT_STACK];
Packit df99a1
  int sp = 1;
Packit df99a1
  slo[0] = lo;
Packit df99a1
  shi[0] = hi;
Packit df99a1
  // Recursion elimination loop
Packit df99a1
  while (--sp>=0)
Packit df99a1
    {
Packit df99a1
      lo = slo[sp];
Packit df99a1
      hi = shi[sp];
Packit df99a1
      // Test for insertion sort
Packit df99a1
      if (hi-lo
Packit df99a1
        {
Packit df99a1
          ranksort(lo, hi, depth);
Packit df99a1
        }
Packit df99a1
      else
Packit df99a1
        {
Packit df99a1
          int tmp;
Packit df99a1
          int *rr=rank+depth;
Packit df99a1
          int med = pivot3r(rr,lo,hi);
Packit df99a1
          // -- positions are organized as follows:
Packit df99a1
          //   [lo..l1[ [l1..l[ ]h..h1] ]h1..hi]
Packit df99a1
          //      =        <       >        =
Packit df99a1
          int l1 = lo;
Packit df99a1
          int h1 = hi;
Packit df99a1
          while (rr[posn[l1]]==med && l1
Packit df99a1
          while (rr[posn[h1]]==med && l1
Packit df99a1
          int l = l1;
Packit df99a1
          int h = h1;
Packit df99a1
          // -- partition set
Packit df99a1
          for (;;)
Packit df99a1
            {
Packit df99a1
              while (l<=h)
Packit df99a1
                {
Packit df99a1
                  int c = rr[posn[l]] - med;
Packit df99a1
                  if (c > 0) break;
Packit df99a1
                  if (c == 0) { tmp=posn[l]; posn[l]=posn[l1]; posn[l1++]=tmp; }
Packit df99a1
                  l++;
Packit df99a1
                }
Packit df99a1
              while (l<=h)
Packit df99a1
                {
Packit df99a1
                  int c = rr[posn[h]] - med;
Packit df99a1
                  if (c < 0) break;
Packit df99a1
                  if (c == 0) { tmp=posn[h]; posn[h]=posn[h1]; posn[h1--]=tmp; }
Packit df99a1
                  h--;
Packit df99a1
                }
Packit df99a1
              if (l>h) break;
Packit df99a1
              tmp=posn[l]; posn[l]=posn[h]; posn[h]=tmp;
Packit df99a1
            }
Packit df99a1
          // -- reorganize as follows
Packit df99a1
          //   [lo..l1[ [l1..h1] ]h1..hi]
Packit df99a1
          //      <        =        > 
Packit df99a1
          tmp = mini(l1-lo, l-l1);
Packit df99a1
          vswap(lo, l-tmp, tmp, posn);
Packit df99a1
          l1 = lo + (l-l1);
Packit df99a1
          tmp = mini(hi-h1, h1-h);
Packit df99a1
          vswap(hi-tmp+1, h+1, tmp, posn);
Packit df99a1
          h1 = hi - (h1-h);
Packit df99a1
          // -- process segments
Packit df99a1
          ASSERT(sp+2
Packit df99a1
          // ----- middle segment (=?) [l1, h1]
Packit df99a1
          for(int i=l1;i<=h1;i++) 
Packit df99a1
            rank[posn[i]] = h1;
Packit df99a1
          // ----- lower segment (<) [lo, l1[
Packit df99a1
          if (l1 > lo)
Packit df99a1
            {
Packit df99a1
              for(int i=lo;i
Packit df99a1
                rank[posn[i]]=l1-1;
Packit df99a1
              slo[sp]=lo;
Packit df99a1
              shi[sp]=l1-1;
Packit df99a1
              if (slo[sp] < shi[sp])  
Packit df99a1
                sp++;
Packit df99a1
            }
Packit df99a1
          // ----- upper segment (>) ]h1, hi]
Packit df99a1
          if (h1 < hi)
Packit df99a1
            {
Packit df99a1
              slo[sp]=h1+1;
Packit df99a1
              shi[sp]=hi;
Packit df99a1
              if (slo[sp] < shi[sp])  
Packit df99a1
                sp++;
Packit df99a1
            }
Packit df99a1
        }
Packit df99a1
    }
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
// GTD -- compare suffixes using data information 
Packit df99a1
//  (up to depth PRESORT_DEPTH)
Packit df99a1
Packit df99a1
inline int 
Packit df99a1
_BSort::GTD(int p1, int p2, int depth)
Packit df99a1
{
Packit df99a1
  unsigned char c1, c2;
Packit df99a1
  p1+=depth; p2+=depth;
Packit df99a1
  while (depth < PRESORT_DEPTH)
Packit df99a1
    {
Packit df99a1
      // Perform two
Packit df99a1
      c1=data[p1]; c2=data[p2];
Packit df99a1
      if (c1!=c2) 
Packit df99a1
        return (c1>c2);
Packit df99a1
      c1=data[p1+1]; c2=data[p2+1];
Packit df99a1
      p1+=2;  p2+=2; depth+=2;
Packit df99a1
      if (c1!=c2) 
Packit df99a1
        return (c1>c2);
Packit df99a1
    }
Packit df99a1
  if (p1
Packit df99a1
    return 0;
Packit df99a1
  return (p1
Packit df99a1
}
Packit df99a1
Packit df99a1
// pivot3d -- return suitable pivot
Packit df99a1
Packit df99a1
inline unsigned char
Packit df99a1
_BSort::pivot3d(unsigned char *rr, int lo, int hi)
Packit df99a1
{
Packit df99a1
  unsigned char c1, c2, c3;
Packit df99a1
  if (hi-lo > 256)
Packit df99a1
    {
Packit df99a1
      c1 = pivot3d(rr, lo, (6*lo+2*hi)/8);
Packit df99a1
      c2 = pivot3d(rr, (5*lo+3*hi)/8, (3*lo+5*hi)/8);
Packit df99a1
      c3 = pivot3d(rr, (2*lo+6*hi)/8, hi);
Packit df99a1
    }
Packit df99a1
  else
Packit df99a1
    {
Packit df99a1
      c1 = rr[posn[lo]];
Packit df99a1
      c2 = rr[posn[(lo+hi)/2]];
Packit df99a1
      c3 = rr[posn[hi]];
Packit df99a1
    }
Packit df99a1
  // Extract median
Packit df99a1
  if (c1>c3)
Packit df99a1
    { int tmp=c1; c1=c3; c3=tmp; }
Packit df99a1
  if (c2<=c1)
Packit df99a1
    return c1;
Packit df99a1
  else if (c2>=c3)
Packit df99a1
    return c3;
Packit df99a1
  else
Packit df99a1
    return c2;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort::quicksort3d -- Three way quicksort algorithm 
Packit df99a1
//    Sort suffixes based on strings until reaching
Packit df99a1
//    depth rank at pos+depth
Packit df99a1
//    The algorithm breaks into ranksort when size is 
Packit df99a1
//    smaller than PRESORT_THRESH
Packit df99a1
Packit df99a1
void 
Packit df99a1
_BSort::quicksort3d(int lo, int hi, int depth)
Packit df99a1
{
Packit df99a1
  /* Initialize stack */
Packit df99a1
  int slo[QUICKSORT_STACK];
Packit df99a1
  int shi[QUICKSORT_STACK];
Packit df99a1
  int sd[QUICKSORT_STACK];
Packit df99a1
  int sp = 1;
Packit df99a1
  slo[0] = lo;
Packit df99a1
  shi[0] = hi;
Packit df99a1
  sd[0] = depth;
Packit df99a1
  // Recursion elimination loop
Packit df99a1
  while (--sp>=0)
Packit df99a1
    {
Packit df99a1
      lo = slo[sp];
Packit df99a1
      hi = shi[sp];
Packit df99a1
      depth = sd[sp];
Packit df99a1
      // Test for insertion sort
Packit df99a1
      if (depth >= PRESORT_DEPTH)
Packit df99a1
        {
Packit df99a1
          for (int i=lo; i<=hi; i++)
Packit df99a1
            rank[posn[i]] = hi;
Packit df99a1
        }
Packit df99a1
      else if (hi-lo
Packit df99a1
        {
Packit df99a1
          int i,j;
Packit df99a1
          for (i=lo+1; i<=hi; i++)
Packit df99a1
            {
Packit df99a1
              int tmp = posn[i];
Packit df99a1
              for(j=i-1; j>=lo && GTD(posn[j], tmp, depth); j--)
Packit df99a1
                posn[j+1] = posn[j];
Packit df99a1
              posn[j+1] = tmp;
Packit df99a1
            }
Packit df99a1
          for(i=hi;i>=lo;i=j)
Packit df99a1
            {
Packit df99a1
              int tmp = posn[i];
Packit df99a1
              rank[tmp] = i;
Packit df99a1
              for (j=i-1; j>=lo && !GTD(tmp,posn[j],depth); j--)
Packit df99a1
                rank[posn[j]] = i;
Packit df99a1
            }
Packit df99a1
        }
Packit df99a1
        else
Packit df99a1
        {
Packit df99a1
          int tmp;
Packit df99a1
          unsigned char *dd=data+depth;
Packit df99a1
          unsigned char med = pivot3d(dd,lo,hi);
Packit df99a1
          // -- positions are organized as follows:
Packit df99a1
          //   [lo..l1[ [l1..l[ ]h..h1] ]h1..hi]
Packit df99a1
          //      =        <       >        =
Packit df99a1
          int l1 = lo;
Packit df99a1
          int h1 = hi;
Packit df99a1
          while (dd[posn[l1]]==med && l1
Packit df99a1
          while (dd[posn[h1]]==med && l1
Packit df99a1
          int l = l1;
Packit df99a1
          int h = h1;
Packit df99a1
          // -- partition set
Packit df99a1
          for (;;)
Packit df99a1
            {
Packit df99a1
              while (l<=h)
Packit df99a1
                {
Packit df99a1
                  int c = (int)dd[posn[l]] - (int)med;
Packit df99a1
                  if (c > 0) break;
Packit df99a1
                  if (c == 0) { tmp=posn[l]; posn[l]=posn[l1]; posn[l1++]=tmp; }
Packit df99a1
                  l++;
Packit df99a1
                }
Packit df99a1
              while (l<=h)
Packit df99a1
                {
Packit df99a1
                  int c = (int)dd[posn[h]] - (int)med;
Packit df99a1
                  if (c < 0) break;
Packit df99a1
                  if (c == 0) { tmp=posn[h]; posn[h]=posn[h1]; posn[h1--]=tmp; }
Packit df99a1
                  h--;
Packit df99a1
                }
Packit df99a1
              if (l>h) break;
Packit df99a1
              tmp=posn[l]; posn[l]=posn[h]; posn[h]=tmp;
Packit df99a1
            }
Packit df99a1
          // -- reorganize as follows
Packit df99a1
          //   [lo..l1[ [l1..h1] ]h1..hi]
Packit df99a1
          //      <        =        > 
Packit df99a1
          tmp = mini(l1-lo, l-l1);
Packit df99a1
          vswap(lo, l-tmp, tmp, posn);
Packit df99a1
          l1 = lo + (l-l1);
Packit df99a1
          tmp = mini(hi-h1, h1-h);
Packit df99a1
          vswap(hi-tmp+1, h+1, tmp, posn);
Packit df99a1
          h1 = hi - (h1-h);
Packit df99a1
          // -- process segments
Packit df99a1
          ASSERT(sp+3
Packit df99a1
          // ----- middle segment (=?) [l1, h1]
Packit df99a1
          l = l1; h = h1;
Packit df99a1
          if (med==0) // special case for marker [slow]
Packit df99a1
            for (int i=l; i<=h; i++)
Packit df99a1
              if ((int)posn[i]+depth == size-1)
Packit df99a1
                { 
Packit df99a1
                  tmp=posn[i]; posn[i]=posn[l]; posn[l]=tmp; 
Packit df99a1
                  rank[tmp]=l++; break; 
Packit df99a1
                }
Packit df99a1
          if (l
Packit df99a1
            { slo[sp] = l; shi[sp] = h; sd[sp++] = depth+1; }
Packit df99a1
          else if (l==h)
Packit df99a1
            { rank[posn[h]] = h; }
Packit df99a1
          // ----- lower segment (<) [lo, l1[
Packit df99a1
          l = lo;
Packit df99a1
          h = l1-1;
Packit df99a1
          if (l
Packit df99a1
            { slo[sp] = l; shi[sp] = h; sd[sp++] = depth; }
Packit df99a1
          else if (l==h)
Packit df99a1
            { rank[posn[h]] = h; }
Packit df99a1
          // ----- upper segment (>) ]h1, hi]
Packit df99a1
          l = h1+1;
Packit df99a1
          h = hi;
Packit df99a1
          if (l
Packit df99a1
            { slo[sp] = l; shi[sp] = h; sd[sp++] = depth; }
Packit df99a1
          else if (l==h)
Packit df99a1
            { rank[posn[h]] = h; }
Packit df99a1
        }
Packit df99a1
    }
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort::radixsort8 -- 8 bit radix sort
Packit df99a1
Packit df99a1
void 
Packit df99a1
_BSort::radixsort8(void)
Packit df99a1
{
Packit df99a1
  int i;
Packit df99a1
  // Initialize frequency array
Packit df99a1
  int lo[256], hi[256];
Packit df99a1
  for (i=0; i<256; i++)
Packit df99a1
    hi[i] = lo[i] = 0;
Packit df99a1
  // Count occurences
Packit df99a1
  for (i=0; i
Packit df99a1
    hi[data[i]] ++;
Packit df99a1
  // Compute positions (lo)
Packit df99a1
  int last = 1;
Packit df99a1
  for (i=0; i<256; i++)
Packit df99a1
    {
Packit df99a1
      lo[i] = last;
Packit df99a1
      hi[i] = last + hi[i] - 1;
Packit df99a1
      last = hi[i] + 1;
Packit df99a1
    }
Packit df99a1
  for (i=0; i
Packit df99a1
    {
Packit df99a1
      posn[ lo[data[i]]++ ] = i;
Packit df99a1
      rank[ i ] = hi[data[i]];
Packit df99a1
    }
Packit df99a1
  // Process marker "$"
Packit df99a1
  posn[0] = size-1;
Packit df99a1
  rank[size-1] = 0;
Packit df99a1
  // Extra element
Packit df99a1
  rank[size] = -1;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort::radixsort16 -- 16 bit radix sort
Packit df99a1
Packit df99a1
void 
Packit df99a1
_BSort::radixsort16(void)
Packit df99a1
{
Packit df99a1
  int i;
Packit df99a1
  // Initialize frequency array
Packit df99a1
  int *ftab;
Packit df99a1
  GPBuffer<int> gftab(ftab,65536);
Packit df99a1
  for (i=0; i<65536; i++)
Packit df99a1
    ftab[i] = 0;
Packit df99a1
  // Count occurences
Packit df99a1
  unsigned char c1 = data[0];
Packit df99a1
  for (i=0; i
Packit df99a1
    {
Packit df99a1
      unsigned char c2 = data[i+1];
Packit df99a1
      ftab[(c1<<8)|c2] ++;
Packit df99a1
      c1 = c2;
Packit df99a1
    }
Packit df99a1
  // Generate upper position
Packit df99a1
  for (i=1;i<65536;i++)
Packit df99a1
    ftab[i] += ftab[i-1];
Packit df99a1
  // Fill rank array with upper bound
Packit df99a1
  c1 = data[0];
Packit df99a1
  for (i=0; i
Packit df99a1
    {
Packit df99a1
      unsigned char c2 = data[i+1];
Packit df99a1
      rank[i] = ftab[(c1<<8)|c2];
Packit df99a1
      c1 = c2;
Packit df99a1
    }
Packit df99a1
  // Fill posn array (backwards)
Packit df99a1
  c1 = data[size-2];
Packit df99a1
  for (i=size-3; i>=0; i--)
Packit df99a1
    {
Packit df99a1
      unsigned char c2 = data[i];
Packit df99a1
      posn[ ftab[(c2<<8)|c1]-- ] = i;
Packit df99a1
      c1 = c2;
Packit df99a1
    }
Packit df99a1
  // Fixup marker stuff
Packit df99a1
  ASSERT(data[size-1]==0);
Packit df99a1
  c1 = data[size-2];
Packit df99a1
  posn[0] = size-1;
Packit df99a1
  posn[ ftab[(c1<<8)] ] = size-2;
Packit df99a1
  rank[size-1] = 0;
Packit df99a1
  rank[size-2] = ftab[(c1<<8)];
Packit df99a1
  // Extra element
Packit df99a1
  rank[size] = -1;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
Packit df99a1
// _BSort::run -- main sort loop
Packit df99a1
Packit df99a1
void
Packit df99a1
_BSort::run(int &markerpos)
Packit df99a1
{
Packit df99a1
  int lo, hi;
Packit df99a1
  ASSERT(size>0);
Packit df99a1
  ASSERT(data[size-1]==0);
Packit df99a1
#ifdef BSORT_TIMER
Packit df99a1
  long start = GOS::ticks();
Packit df99a1
#endif  
Packit df99a1
  // Step 1: Radix sort 
Packit df99a1
  int depth = 0;
Packit df99a1
  if (size > RADIX_THRESH)
Packit df99a1
    { 
Packit df99a1
      radixsort16();
Packit df99a1
      depth=2;
Packit df99a1
    }
Packit df99a1
  else
Packit df99a1
    { 
Packit df99a1
      radixsort8(); 
Packit df99a1
      depth=1;
Packit df99a1
    }
Packit df99a1
  // Step 2: Perform presort to depth PRESORT_DEPTH
Packit df99a1
  for (lo=0; lo
Packit df99a1
    {
Packit df99a1
      hi = rank[posn[lo]];
Packit df99a1
      if (lo < hi)
Packit df99a1
        quicksort3d(lo, hi, depth);
Packit df99a1
      lo = hi;
Packit df99a1
    }
Packit df99a1
  depth = PRESORT_DEPTH;
Packit df99a1
#ifdef BSORT_TIMER
Packit df99a1
  long middle = GOS::ticks();
Packit df99a1
#endif  
Packit df99a1
  // Step 3: Perform rank doubling
Packit df99a1
  int again = 1;
Packit df99a1
  while (again)
Packit df99a1
    {
Packit df99a1
      again = 0;
Packit df99a1
      int sorted_lo = 0;
Packit df99a1
      for (lo=0; lo
Packit df99a1
        {
Packit df99a1
          hi = rank[posn[lo]&0xffffff];
Packit df99a1
          if (lo == hi)
Packit df99a1
            {
Packit df99a1
              lo += (posn[lo]>>24) & 0xff;
Packit df99a1
            }
Packit df99a1
          else
Packit df99a1
            {
Packit df99a1
              if (hi-lo < RANKSORT_THRESH)
Packit df99a1
                {
Packit df99a1
                  ranksort(lo, hi, depth);
Packit df99a1
                }
Packit df99a1
              else
Packit df99a1
                {
Packit df99a1
                  again += 1;
Packit df99a1
                  while (sorted_lo < lo-1)
Packit df99a1
                    {
Packit df99a1
                      int step = mini(255, lo-1-sorted_lo);
Packit df99a1
                      posn[sorted_lo] = (posn[sorted_lo]&0xffffff) | (step<<24);
Packit df99a1
                      sorted_lo += step+1;
Packit df99a1
                    }
Packit df99a1
                  quicksort3r(lo, hi, depth);
Packit df99a1
                  sorted_lo = hi + 1;
Packit df99a1
                }
Packit df99a1
              lo = hi;
Packit df99a1
            }
Packit df99a1
        }
Packit df99a1
      // Finish threading
Packit df99a1
      while (sorted_lo < lo-1)
Packit df99a1
        {
Packit df99a1
          int step = mini(255, lo-1-sorted_lo);
Packit df99a1
          posn[sorted_lo] = (posn[sorted_lo]&0xffffff) | (step<<24);
Packit df99a1
          sorted_lo += step+1;
Packit df99a1
        }
Packit df99a1
      // Double depth
Packit df99a1
      depth += depth;
Packit df99a1
    }
Packit df99a1
  // Step 4: Permute data
Packit df99a1
  int i;
Packit df99a1
  markerpos = -1;
Packit df99a1
  for (i=0; i
Packit df99a1
    rank[i] = data[i];
Packit df99a1
  for (i=0; i
Packit df99a1
    {
Packit df99a1
      int j = posn[i] & 0xffffff;
Packit df99a1
      if (j>0) 
Packit df99a1
        { 
Packit df99a1
          data[i] = rank[j-1];
Packit df99a1
        } 
Packit df99a1
      else 
Packit df99a1
        {
Packit df99a1
          data[i] = 0;
Packit df99a1
          markerpos = i;
Packit df99a1
        }
Packit df99a1
    }
Packit df99a1
  ASSERT(markerpos>=0 && markerpos
Packit df99a1
#ifdef BSORT_TIMER
Packit df99a1
  long end = GOS::ticks();
Packit df99a1
  DjVuPrintErrorUTF8("Sorting time: %d bytes in %ld + %ld = %ld ms\n", 
Packit df99a1
          size-1, middle-start, end-middle, end-start);
Packit df99a1
#endif  
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
// ========================================
Packit df99a1
// -- Encoding
Packit df99a1
Packit df99a1
static void
Packit df99a1
encode_raw(ZPCodec &zp, int bits, int x)
Packit df99a1
{
Packit df99a1
  int n = 1;
Packit df99a1
  int m = (1<
Packit df99a1
  while (n < m)
Packit df99a1
    {
Packit df99a1
      x = (x & (m-1)) << 1;
Packit df99a1
      int b = (x >> bits);
Packit df99a1
      zp.encoder(b);
Packit df99a1
      n = (n<<1) | b;
Packit df99a1
    }
Packit df99a1
}
Packit df99a1
Packit df99a1
static inline void
Packit df99a1
encode_binary(ZPCodec &zp, BitContext *ctx, int bits, int x)
Packit df99a1
{
Packit df99a1
  // Require 2^bits-1  contexts
Packit df99a1
  int n = 1;
Packit df99a1
  int m = (1<
Packit df99a1
  ctx = ctx - 1;
Packit df99a1
  while (n < m)
Packit df99a1
    {
Packit df99a1
      x = (x & (m-1)) << 1;
Packit df99a1
      int b = (x >> bits);
Packit df99a1
      zp.encoder(b, ctx[n]);
Packit df99a1
      n = (n<<1) | b;
Packit df99a1
    }
Packit df99a1
}
Packit df99a1
Packit df99a1
// BSByteStream::Encode -- encoding side of BSByteStream.
//   Overrides write() and flush(); the protected encode() member runs the
//   block sort on the buffered data and emits it through the ZP coder.
class BSByteStream::Encode : public BSByteStream
{
public:
  /** Creates an encoder bound to ByteStream #bs#.
      NOTE(review): presumably #bs# receives the compressed output --
      confirm against the constructor definition. */
  Encode(GP<ByteStream> bs);
  ~Encode();
  /** Second construction stage; #encoding# is interpreted by the
      definition, which is not part of this section. */
  void init(const int encoding);
  // Virtual functions
  virtual size_t write(const void *buffer, size_t sz);
  virtual void flush(void);
protected:
  /** Encodes the current block (see the definition that follows). */
  unsigned int encode(void);
};
Packit df99a1
Packit df99a1
unsigned int
Packit df99a1
BSByteStream::Encode::encode()
Packit df99a1
{ 
Packit df99a1
  /////////////////////////////////
Packit df99a1
  ////////////  Block Sort Tranform
Packit df99a1
Packit df99a1
  int markerpos = size-1;
Packit df99a1
  blocksort(data,size,markerpos);
Packit df99a1
Packit df99a1
  /////////////////////////////////
Packit df99a1
  //////////// Encode Output Stream
Packit df99a1
Packit df99a1
  // Header
Packit df99a1
  ZPCodec &zp=*gzp;
Packit df99a1
  encode_raw(zp, 24, size);
Packit df99a1
  // Determine and Encode Estimation Speed
Packit df99a1
  int fshift = 0;
Packit df99a1
  if (size < FREQS0)
Packit df99a1
    { fshift=0; zp.encoder(0); }
Packit df99a1
  else if (size < FREQS1)
Packit df99a1
    { fshift = 1; zp.encoder(1); zp.encoder(0); }
Packit df99a1
  else
Packit df99a1
    { fshift = 2; zp.encoder(1); zp.encoder(1); }
Packit df99a1
  // MTF
Packit df99a1
  unsigned char mtf[256];
Packit df99a1
  unsigned char rmtf[256];
Packit df99a1
  unsigned int  freq[FREQMAX];
Packit df99a1
  int m = 0;
Packit df99a1
  for (m=0; m<256; m++)
Packit df99a1
    mtf[m] = m;
Packit df99a1
  for (m=0; m<256; m++)
Packit df99a1
    rmtf[mtf[m]] = m;
Packit df99a1
  int fadd = 4;
Packit df99a1
  for (m=0; m
Packit df99a1
    freq[m] = 0;
Packit df99a1
  // Encode
Packit df99a1
  int i;
Packit df99a1
  int mtfno = 3;
Packit df99a1
  for (i=0; i
Packit df99a1
    {
Packit df99a1
      // Get MTF data
Packit df99a1
      int c = data[i];
Packit df99a1
      int ctxid = CTXIDS-1;
Packit df99a1
      if (ctxid>mtfno) ctxid=mtfno;
Packit df99a1
      mtfno = rmtf[c];
Packit df99a1
      if (i==markerpos)
Packit df99a1
        mtfno = 256;
Packit df99a1
      // Encode using ZPCoder
Packit df99a1
      int b;
Packit df99a1
      BitContext *cx = ctx;
Packit df99a1
      b = (mtfno==0);
Packit df99a1
      zp.encoder(b, cx[ctxid]);
Packit df99a1
      if (b) goto rotate; cx+=CTXIDS;
Packit df99a1
      b = (mtfno==1);
Packit df99a1
      zp.encoder(b, cx[ctxid]);
Packit df99a1
      if (b) goto rotate; cx+=CTXIDS;
Packit df99a1
      b = (mtfno<4);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,1,mtfno-2); goto rotate; } 
Packit df99a1
      cx+=1+1;
Packit df99a1
      b = (mtfno<8);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,2,mtfno-4); goto rotate; } 
Packit df99a1
      cx+=1+3;
Packit df99a1
      b = (mtfno<16);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,3,mtfno-8); goto rotate; } 
Packit df99a1
      cx+=1+7;
Packit df99a1
      b = (mtfno<32);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,4,mtfno-16); goto rotate; } 
Packit df99a1
      cx+=1+15;
Packit df99a1
      b = (mtfno<64);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,5,mtfno-32); goto rotate; } 
Packit df99a1
      cx+=1+31;
Packit df99a1
      b = (mtfno<128);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,6,mtfno-64); goto rotate; } 
Packit df99a1
      cx+=1+63;
Packit df99a1
      b = (mtfno<256);
Packit df99a1
      zp.encoder(b, cx[0]);
Packit df99a1
      if (b) { encode_binary(zp,cx+1,7,mtfno-128); goto rotate; } 
Packit df99a1
      continue;
Packit df99a1
      // Rotate MTF according to empirical frequencies (new!)
Packit df99a1
    rotate:
Packit df99a1
      // Adjust frequencies for overflow
Packit df99a1
      fadd = fadd + (fadd>>fshift);
Packit df99a1
      if (fadd > 0x10000000) 
Packit df99a1
        {
Packit df99a1
          fadd = fadd>>24;
Packit df99a1
          freq[0] >>= 24;
Packit df99a1
          freq[1] >>= 24;
Packit df99a1
          freq[2] >>= 24;
Packit df99a1
          freq[3] >>= 24;
Packit df99a1
          for (int k=4; k
Packit df99a1
            freq[k] = freq[k]>>24;
Packit df99a1
        }
Packit df99a1
      // Relocate new char according to new freq
Packit df99a1
      unsigned int fc = fadd;
Packit df99a1
      if (mtfno < FREQMAX)
Packit df99a1
        fc += freq[mtfno];
Packit df99a1
      int k;
Packit df99a1
      for (k=mtfno; k>=FREQMAX; k--)
Packit df99a1
        {
Packit df99a1
          mtf[k] = mtf[k-1];
Packit df99a1
          rmtf[mtf[k]] = k;
Packit df99a1
        }
Packit df99a1
      for (; k>0 && fc>=freq[k-1]; k--)
Packit df99a1
        {
Packit df99a1
          mtf[k] = mtf[k-1];
Packit df99a1
          freq[k] = freq[k-1];
Packit df99a1
          rmtf[mtf[k]] = k;
Packit df99a1
        }
Packit df99a1
      mtf[k] = c;
Packit df99a1
      freq[k] = fc;
Packit df99a1
      rmtf[mtf[k]] = k;
Packit df99a1
    }
Packit df99a1
  // Terminate
Packit df99a1
  return 0;
Packit df99a1
}
Packit df99a1
Packit df99a1
// ========================================
Packit df99a1
// --- Construction
Packit df99a1
Packit df99a1
// Forwards the output bytestream to the base class.
// Coder and block size are set up later by #init#.
BSByteStream::Encode::Encode(GP<ByteStream> xbs)
: BSByteStream(xbs) {}
Packit df99a1
Packit df99a1
void
Packit df99a1
BSByteStream::Encode::init(const int xencoding)
Packit df99a1
{
Packit df99a1
  gzp=ZPCodec::create(gbs,true,true);
Packit df99a1
  const int encoding=(xencoding
Packit df99a1
  if (encoding > MAXBLOCK)
Packit df99a1
    G_THROW( ERR_MSG("ByteStream.blocksize") "\t" + GUTF8String(MAXBLOCK) );
Packit df99a1
  // Record block size
Packit df99a1
  blocksize = encoding * 1024;
Packit df99a1
  // Initialize context array
Packit df99a1
}
Packit df99a1
Packit df99a1
// Codes whatever is still buffered, then terminates the stream.
BSByteStream::Encode::~Encode()
{
  // Flush
  flush();
  // Encode EOF marker
  // (a block size of zero, written like a regular block header)
  encode_raw(*gzp, 24, 0);
}
Packit df99a1
Packit df99a1
// Creates an encoding BSByteStream writing to #xbs#.
// Argument #blocksize# is the block size in kilobytes, see #Encode::init#.
GP<ByteStream>
BSByteStream::create(GP<ByteStream> xbs,const int blocksize)
{
  BSByteStream::Encode *rbs=new BSByteStream::Encode(xbs);
  // Hand the object to the smart pointer before calling init(),
  // presumably so that it is released if init() throws.
  GP<ByteStream> retval=rbs;
  rbs->init(blocksize);
  return retval;
}
Packit df99a1
Packit df99a1
// ========================================
Packit df99a1
// -- ByteStream interface
Packit df99a1
Packit df99a1
void 
Packit df99a1
BSByteStream::Encode::flush()
Packit df99a1
{
Packit df99a1
  if (bptr>0)
Packit df99a1
  {
Packit df99a1
    ASSERT(bptr<(int)blocksize);
Packit df99a1
    memset(data+bptr, 0, OVERFLOW);
Packit df99a1
    size = bptr+1;
Packit df99a1
    encode();
Packit df99a1
  }
Packit df99a1
  size = bptr = 0;
Packit df99a1
}
Packit df99a1
Packit df99a1
size_t 
Packit df99a1
BSByteStream::Encode::write(const void *buffer, size_t sz)
Packit df99a1
{
Packit df99a1
  // Trivial checks
Packit df99a1
  if (sz == 0)
Packit df99a1
    return 0;
Packit df99a1
  // Loop
Packit df99a1
  int copied = 0;
Packit df99a1
  while (sz > 0)
Packit df99a1
    {
Packit df99a1
      // Initialize
Packit df99a1
      if (!data) 
Packit df99a1
        {
Packit df99a1
          bptr = 0;
Packit df99a1
          gdata.resize(blocksize+OVERFLOW);
Packit df99a1
        }
Packit df99a1
      // Compute remaining
Packit df99a1
      int bytes = blocksize - 1 - bptr;
Packit df99a1
      if (bytes > (int)sz)
Packit df99a1
        bytes = sz;
Packit df99a1
      // Store date (todo: rle)
Packit df99a1
      memcpy(data+bptr, buffer, bytes);
Packit df99a1
      buffer = (void*)((char*)buffer + bytes);
Packit df99a1
      bptr += bytes;
Packit df99a1
      sz -= bytes;
Packit df99a1
      copied += bytes;
Packit df99a1
      offset += bytes;
Packit df99a1
      // Flush when needed
Packit df99a1
      if (bptr + 1 >= (int)blocksize)
Packit df99a1
        flush();
Packit df99a1
    }
Packit df99a1
  // return
Packit df99a1
  return copied;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
#ifdef HAVE_NAMESPACES
Packit df99a1
}
Packit df99a1
# ifndef NOT_USING_DJVU_NAMESPACE
Packit df99a1
using namespace DJVU;
Packit df99a1
# endif
Packit df99a1
#endif