Blame tools/djvuserve.cpp

Packit df99a1
//C-  -*- C++ -*-
Packit df99a1
//C- -------------------------------------------------------------------
Packit df99a1
//C- DjVuLibre-3.5
Packit df99a1
//C- Copyright (c) 2002  Leon Bottou and Yann Le Cun.
Packit df99a1
//C- Copyright (c) 2001  AT&T
Packit df99a1
//C-
Packit df99a1
//C- This software is subject to, and may be distributed under, the
Packit df99a1
//C- GNU General Public License, either Version 2 of the license,
Packit df99a1
//C- or (at your option) any later version. The license should have
Packit df99a1
//C- accompanied the software or you may obtain a copy of the license
Packit df99a1
//C- from the Free Software Foundation at http://www.fsf.org .
Packit df99a1
//C-
Packit df99a1
//C- This program is distributed in the hope that it will be useful,
Packit df99a1
//C- but WITHOUT ANY WARRANTY; without even the implied warranty of
Packit df99a1
//C- MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.  See the
Packit df99a1
//C- GNU General Public License for more details.
Packit df99a1
//C- 
Packit df99a1
//C- DjVuLibre-3.5 is derived from the DjVu(r) Reference Library from
Packit df99a1
//C- Lizardtech Software.  Lizardtech Software has authorized us to
Packit df99a1
//C- replace the original DjVu(r) Reference Library notice by the following
Packit df99a1
//C- text (see doc/lizard2002.djvu and doc/lizardtech2007.djvu):
Packit df99a1
//C-
Packit df99a1
//C-  ------------------------------------------------------------------
Packit df99a1
//C- | DjVu (r) Reference Library (v. 3.5)
Packit df99a1
//C- | Copyright (c) 1999-2001 LizardTech, Inc. All Rights Reserved.
Packit df99a1
//C- | The DjVu Reference Library is protected by U.S. Pat. No.
Packit df99a1
//C- | 6,058,214 and patents pending.
Packit df99a1
//C- |
Packit df99a1
//C- | This software is subject to, and may be distributed under, the
Packit df99a1
//C- | GNU General Public License, either Version 2 of the license,
Packit df99a1
//C- | or (at your option) any later version. The license should have
Packit df99a1
//C- | accompanied the software or you may obtain a copy of the license
Packit df99a1
//C- | from the Free Software Foundation at http://www.fsf.org .
Packit df99a1
//C- |
Packit df99a1
//C- | The computer code originally released by LizardTech under this
Packit df99a1
//C- | license and unmodified by other parties is deemed "the LIZARDTECH
Packit df99a1
//C- | ORIGINAL CODE."  Subject to any third party intellectual property
Packit df99a1
//C- | claims, LizardTech grants recipient a worldwide, royalty-free, 
Packit df99a1
//C- | non-exclusive license to make, use, sell, or otherwise dispose of 
Packit df99a1
//C- | the LIZARDTECH ORIGINAL CODE or of programs derived from the 
Packit df99a1
//C- | LIZARDTECH ORIGINAL CODE in compliance with the terms of the GNU 
Packit df99a1
//C- | General Public License.   This grant only confers the right to 
Packit df99a1
//C- | infringe patent claims underlying the LIZARDTECH ORIGINAL CODE to 
Packit df99a1
//C- | the extent such infringement is reasonably necessary to enable 
Packit df99a1
//C- | recipient to make, have made, practice, sell, or otherwise dispose 
Packit df99a1
//C- | of the LIZARDTECH ORIGINAL CODE (or portions thereof) and not to 
Packit df99a1
//C- | any greater extent that may be necessary to utilize further 
Packit df99a1
//C- | modifications or combinations.
Packit df99a1
//C- |
Packit df99a1
//C- | The LIZARDTECH ORIGINAL CODE is provided "AS IS" WITHOUT WARRANTY
Packit df99a1
//C- | OF ANY KIND, EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED
Packit df99a1
//C- | TO ANY WARRANTY OF NON-INFRINGEMENT, OR ANY IMPLIED WARRANTY OF
Packit df99a1
//C- | MERCHANTABILITY OR FITNESS FOR A PARTICULAR PURPOSE.
Packit df99a1
//C- +------------------------------------------------------------------
Packit df99a1
Packit df99a1
#ifdef HAVE_CONFIG_H
Packit df99a1
# include "config.h"
Packit df99a1
#endif
Packit df99a1
#if NEED_GNUG_PRAGMAS
Packit df99a1
# pragma implementation
Packit df99a1
#endif
Packit df99a1
Packit df99a1
#include "DjVuDocument.h"
Packit df99a1
#include "DjVmDir.h"
Packit df99a1
#include "ByteStream.h"
Packit df99a1
#include "IFFByteStream.h"
Packit df99a1
#include "DjVuText.h"
Packit df99a1
#include "DjVuImage.h"
Packit df99a1
#include "GString.h"
Packit df99a1
#include "GOS.h"
Packit df99a1
#include "GURL.h"
Packit df99a1
#include "DjVuMessage.h"
Packit df99a1
Packit df99a1
#include "common.h"
Packit df99a1
Packit df99a1
#include <sys/stat.h>
Packit df99a1
#include <time.h>
Packit df99a1
Packit df99a1
Packit df99a1
static bool cgi = false;
Packit df99a1
static bool head = false;
Packit df99a1
Packit df99a1
Packit df99a1
struct DJVUSERVEGlobal 
Packit df99a1
{
Packit df99a1
  // Globals that need static initialization
Packit df99a1
  // are grouped here to work around broken compilers.
Packit df99a1
  GUTF8String pathinfo;
Packit df99a1
  GUTF8String pathtranslated;
Packit df99a1
  GUTF8String requestmethod;
Packit df99a1
  GUTF8String querystring;
Packit df99a1
};
Packit df99a1
Packit df99a1
static DJVUSERVEGlobal& g(void)
Packit df99a1
{
Packit df99a1
  static DJVUSERVEGlobal g;
Packit df99a1
  return g;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
static void
Packit df99a1
usage(void)
Packit df99a1
{
Packit df99a1
   DjVuPrintErrorUTF8(
Packit df99a1
#ifdef DJVULIBRE_VERSION
Packit df99a1
          "DJVUSERVE --- DjVuLibre-" DJVULIBRE_VERSION "\n"
Packit df99a1
#endif
Packit df99a1
          "Extracts hidden text from Djvu files\n"
Packit df99a1
          "\n"
Packit df99a1
          "Usage: djvuserve [<djvufile>[/<djvmid>]\n"
Packit df99a1
          "Outputs the specified <djvufile> with valid Content-Type,\n"
Packit df99a1
          "Content-Length, and Expire HTTP headers.  Bundled multipage DjVu\n"
Packit df99a1
          "documents are accessed as indirect document using the <djvmid>\n"
Packit df99a1
          "syntax. Specifying a <djvmid> of <index> generates an indirect page\n"
Packit df99a1
          "directory pointing to the other component files.\n"
Packit df99a1
          "This program is designed to be used as a CGI executable.\n"
Packit df99a1
          "It uses environment variable PATH_TRANSLATED when executed\n"
Packit df99a1
          "without arguments.\n\n" );
Packit df99a1
   exit(10);
Packit df99a1
}
Packit df99a1
Packit df99a1
static const char * 
Packit df99a1
day_name(int d)
Packit df99a1
{
Packit df99a1
   static const char *n[] = {
Packit df99a1
     "Sun", "Mon", "Tue", "Wed", "Thu", "Fri", "Sat" 
Packit df99a1
   };
Packit df99a1
   if (d>=0 && d<7)
Packit df99a1
     return n[d];
Packit df99a1
   return "???";
Packit df99a1
}
Packit df99a1
Packit df99a1
static const char* 
Packit df99a1
month_name(int d)
Packit df99a1
{
Packit df99a1
   static const char *n[] = {
Packit df99a1
     "Jan", "Feb", "Mar", "Apr", "May", "Jun",
Packit df99a1
     "Jul", "Aug", "Sep", "Oct", "Nov", "Dec" 
Packit df99a1
   };
Packit df99a1
   if (d>=0 && d<12)
Packit df99a1
     return n[d];
Packit df99a1
   return "???";
Packit df99a1
}
Packit df99a1
Packit df99a1
void
Packit df99a1
fprintdate(FILE *f, const char *fmt, const time_t *tim)
Packit df99a1
{
Packit df99a1
  char ctim[128];
Packit df99a1
  struct tm *ttim = gmtime(tim);
Packit df99a1
  /* strftime(ctim, sizeof(ctim)-1, "%a, %d %b %Y %H:%M:%S GMT", ttim); */
Packit df99a1
  sprintf(ctim,"%3s, %02d %3s %04d %02d:%02d:%02d GMT",
Packit df99a1
	  day_name(ttim->tm_wday), ttim->tm_mday,
Packit df99a1
	  month_name(ttim->tm_mon), 1900+ttim->tm_year,
Packit df99a1
	  ttim->tm_hour, ttim->tm_min, ttim->tm_sec);
Packit df99a1
  fprintf(stdout, fmt, ctim);
Packit df99a1
}
Packit df99a1
Packit df99a1
void
Packit df99a1
headers(const struct stat *statbuf, const char *fname = 0)
Packit df99a1
{
Packit df99a1
  fprintf(stdout,"Content-Type: image/x.djvu\n");
Packit df99a1
  if (fname)
Packit df99a1
    fprintf(stdout,"Content-Disposition: attachment; filename=\"%s\"\n", fname);
Packit df99a1
  fprintf(stdout,"Content-Length: %ld\n", (long)statbuf->st_size);
Packit df99a1
  time_t tim = time(0) + 360 * 24 * 3600;
Packit df99a1
  fprintdate(stdout, "Last-Modified: %s\n", &statbuf->st_mtime);
Packit df99a1
  fprintdate(stdout, "Expires: %s\n", &tim);
Packit df99a1
}
Packit df99a1
Packit df99a1
bool
Packit df99a1
is_djvu_file_bundled(GURL &pathurl)
Packit df99a1
{
Packit df99a1
  GP<ByteStream> in = ByteStream::create(pathurl,"rb");
Packit df99a1
  GP<IFFByteStream> iff = IFFByteStream::create(in);
Packit df99a1
  GUTF8String chkid;
Packit df99a1
  iff->get_chunk(chkid);
Packit df99a1
  // Make sure that this is a DjVu file.
Packit df99a1
  if (chkid != "FORM:DJVU" &&
Packit df99a1
      chkid != "FORM:DJVM" &&
Packit df99a1
      chkid != "FORM:PM44" &&
Packit df99a1
      chkid != "FORM:BM44"   )
Packit df99a1
    G_THROW("Corrupted DjVu file");
Packit df99a1
  // Test if it is bundled
Packit df99a1
  if (chkid == "FORM:DJVM")
Packit df99a1
    {
Packit df99a1
      while (iff->get_chunk(chkid) && chkid!="DIRM")
Packit df99a1
        iff->close_chunk();
Packit df99a1
      if (chkid == "DIRM")
Packit df99a1
        {
Packit df99a1
          GP<ByteStream> dirm = iff->get_bytestream();
Packit df99a1
          if (dirm->read8() & 0x80)
Packit df99a1
            return true;
Packit df99a1
        }
Packit df99a1
    }
Packit df99a1
  return false;
Packit df99a1
}
Packit df99a1
Packit df99a1
void 
Packit df99a1
djvuserver_file(GURL pathurl, bool bundled, bool download)
Packit df99a1
{
Packit df99a1
  GNativeString fname = pathurl.NativeFilename();
Packit df99a1
  struct stat statbuf;
Packit df99a1
  if (stat((const char *)fname, &statbuf) < 0)
Packit df99a1
    G_THROW(strerror(errno));
Packit df99a1
  
Packit df99a1
  // Is this a bundled file?
Packit df99a1
  if (is_djvu_file_bundled(pathurl) && !bundled)
Packit df99a1
    {
Packit df99a1
      // It is bundled
Packit df99a1
      GUTF8String id = pathurl.name();
Packit df99a1
      fprintf(stdout,"Location: %s/index.djvu", (const char*)id);
Packit df99a1
      if (g().querystring.length())
Packit df99a1
        fprintf(stdout,"?%s", (const char*)g().querystring);
Packit df99a1
      fprintf(stdout,"\n\n");
Packit df99a1
      return;
Packit df99a1
    }
Packit df99a1
  // Push the file
Packit df99a1
  if (download)
Packit df99a1
    headers(&statbuf, pathurl.fname());
Packit df99a1
  else
Packit df99a1
    headers(&statbuf);
Packit df99a1
  if (head) 
Packit df99a1
    return;
Packit df99a1
  fprintf(stdout,"\n");
Packit df99a1
  fflush(stdout);
Packit df99a1
  GP<ByteStream> in = ByteStream::create(pathurl,"rb");
Packit df99a1
  GP<ByteStream> out = ByteStream::get_stdout("ab");
Packit df99a1
  out->copy(*in);
Packit df99a1
}
Packit df99a1
Packit df99a1
void 
Packit df99a1
djvuserver_directory(GURL pathurl)
Packit df99a1
{
Packit df99a1
  GNativeString fname = pathurl.NativeFilename();
Packit df99a1
  struct stat statbuf;
Packit df99a1
  if (stat((const char *)fname, &statbuf) < 0)
Packit df99a1
    G_THROW(strerror(errno));
Packit df99a1
  // Find the DIRM chunk directly (save time)
Packit df99a1
  GP<ByteStream> temp;
Packit df99a1
  GP<ByteStream> bsin = ByteStream::create(pathurl,"rb");
Packit df99a1
  GP<DjVmDir> dir = DjVmDir::create();
Packit df99a1
  {
Packit df99a1
    GP<IFFByteStream> iffin = IFFByteStream::create(bsin);
Packit df99a1
    GUTF8String chkid;
Packit df99a1
    iffin->get_chunk(chkid);
Packit df99a1
    if (chkid != "FORM:DJVM")
Packit df99a1
      G_THROW( "This is not a multipage DjVu document" );
Packit df99a1
    while (iffin->get_chunk(chkid) && chkid!="DIRM")
Packit df99a1
      iffin->close_chunk();
Packit df99a1
    if (chkid != "DIRM")
Packit df99a1
      G_THROW( "This is not a new style bundled DjVu document" );
Packit df99a1
    temp = iffin->get_bytestream();
Packit df99a1
    dir->decode(temp);
Packit df99a1
    if (! dir->is_bundled())
Packit df99a1
      G_THROW( "This is not a bundled DjVu document" );
Packit df99a1
  }
Packit df99a1
  // Assemble index of indirect multipage file
Packit df99a1
  GP<ByteStream> bsdir = ByteStream::create();
Packit df99a1
  {
Packit df99a1
    GP<IFFByteStream> iff = IFFByteStream::create(bsdir);
Packit df99a1
    iff->put_chunk("FORM:DJVM",1);
Packit df99a1
    iff->put_chunk("DIRM");
Packit df99a1
    temp = iff->get_bytestream();
Packit df99a1
    dir->encode(temp, false, false);
Packit df99a1
    iff->close_chunk();
Packit df99a1
    iff->close_chunk();
Packit df99a1
  }
Packit df99a1
  // HTTP output
Packit df99a1
  statbuf.st_size = bsdir->tell();
Packit df99a1
  headers(&statbuf);
Packit df99a1
  if (head) 
Packit df99a1
    return;
Packit df99a1
  bsdir->seek(0);
Packit df99a1
  fprintf(stdout,"\n");
Packit df99a1
  fflush(stdout);
Packit df99a1
  GP<ByteStream> out = ByteStream::get_stdout("ab");
Packit df99a1
  out->copy(*bsdir);
Packit df99a1
}
Packit df99a1
Packit df99a1
void 
Packit df99a1
djvuserver_component(GURL pathurl, GUTF8String id)
Packit df99a1
{
Packit df99a1
  GNativeString fname = pathurl.NativeFilename();
Packit df99a1
  struct stat statbuf;
Packit df99a1
  if (stat((const char *)fname, &statbuf) < 0)
Packit df99a1
    G_THROW(strerror(errno));
Packit df99a1
  // Find the DIRM chunk directly (save time)
Packit df99a1
  GP<ByteStream> temp;
Packit df99a1
  GP<ByteStream> bsin = ByteStream::create(pathurl,"rb");
Packit df99a1
  GP<DjVmDir> dir = DjVmDir::create();
Packit df99a1
  {
Packit df99a1
    GP<IFFByteStream> iffin = IFFByteStream::create(bsin);
Packit df99a1
    GUTF8String chkid;
Packit df99a1
    iffin->get_chunk(chkid);
Packit df99a1
    if (chkid != "FORM:DJVM")
Packit df99a1
      G_THROW( "This is not a multipage DjVu document" );
Packit df99a1
    while (iffin->get_chunk(chkid) && chkid!="DIRM")
Packit df99a1
      iffin->close_chunk();
Packit df99a1
    if (chkid != "DIRM")
Packit df99a1
      G_THROW( "This is not a new style bundled DjVu document" );
Packit df99a1
    temp = iffin->get_bytestream();
Packit df99a1
    dir->decode(temp);
Packit df99a1
    if (! dir->is_bundled())
Packit df99a1
      G_THROW( "This is not a bundled DjVu document" );
Packit df99a1
  }
Packit df99a1
  // Find the file record
Packit df99a1
  GP<DjVmDir::File> frec = dir->id_to_file(id);
Packit df99a1
  if (!frec)
Packit df99a1
    G_THROW( "Cannot locate requested component file" );
Packit df99a1
  if (!frec->size || !frec->offset)
Packit df99a1
    G_THROW( "Corrupted DjVu directory" );
Packit df99a1
Packit df99a1
  // HTTP output
Packit df99a1
  statbuf.st_size = frec->size + 4;
Packit df99a1
  headers(&statbuf);
Packit df99a1
  if (head) 
Packit df99a1
    return;
Packit df99a1
  fprintf(stdout,"\n");
Packit df99a1
  fflush(stdout);
Packit df99a1
  GP<ByteStream> out = ByteStream::get_stdout("ab");
Packit df99a1
  out->writall("AT&T", 4);
Packit df99a1
  bsin->seek(frec->offset);
Packit df99a1
  out->copy(*bsin, frec->size);
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
bool
Packit df99a1
search_cgi_arg(const char *name)
Packit df99a1
{
Packit df99a1
  const char *s = g().querystring;
Packit df99a1
  int l = strlen(name);
Packit df99a1
  if (*s == '?')
Packit df99a1
    s += 1;
Packit df99a1
  while (*s)
Packit df99a1
    {
Packit df99a1
      if (! strncmp(s, name, l))
Packit df99a1
        if (s[l]=='&' || s[l]=='=' || s[l]==0)
Packit df99a1
          return true;
Packit df99a1
      while (*s && *s != '&')
Packit df99a1
        s += 1;
Packit df99a1
      if (*s == '&')
Packit df99a1
        s += 1;
Packit df99a1
    }
Packit df99a1
  return false;
Packit df99a1
}
Packit df99a1
Packit df99a1
Packit df99a1
int
Packit df99a1
main(int argc, char ** argv)
Packit df99a1
{
Packit df99a1
  DJVU_LOCALE;
Packit df99a1
  G_TRY 
Packit df99a1
    {
Packit df99a1
      // Obtain path
Packit df99a1
      bool bundled = false;
Packit df99a1
      bool download = false;
Packit df99a1
      if (argc == 1)
Packit df99a1
        {
Packit df99a1
          cgi = true;
Packit df99a1
          g().pathinfo = GNativeString(getenv("PATH_INFO"));
Packit df99a1
          g().pathtranslated = GNativeString(getenv("PATH_TRANSLATED"));
Packit df99a1
          if (! g().pathinfo)
Packit df99a1
            usage();
Packit df99a1
          if (! g().pathtranslated)
Packit df99a1
            G_THROW("No path information");
Packit df99a1
          g().requestmethod = GNativeString(getenv("REQUEST_METHOD"));
Packit df99a1
          g().querystring = GUTF8String(getenv("QUERY_STRING"));
Packit df99a1
          if (search_cgi_arg("bundled"))
Packit df99a1
            bundled = true;
Packit df99a1
          if (search_cgi_arg("download") || search_cgi_arg("bundle"))
Packit df99a1
            bundled = download = true;
Packit df99a1
        }
Packit df99a1
      else if (argc == 2)
Packit df99a1
        {
Packit df99a1
          cgi = false;
Packit df99a1
          g().pathtranslated = GNativeString(argv[1]);
Packit df99a1
          g().requestmethod = "GET";
Packit df99a1
        }
Packit df99a1
      if (! g().pathtranslated)
Packit df99a1
        usage();
Packit df99a1
      head = false;
Packit df99a1
      if (g().requestmethod == "HEAD")
Packit df99a1
        head = true;
Packit df99a1
      else if (g().requestmethod != "GET")
Packit df99a1
        G_THROW("Only serve HEAD and GET requests");
Packit df99a1
      // Do it.
Packit df99a1
      GURL pathurl = GURL::Filename::UTF8(g().pathtranslated);
Packit df99a1
      if (pathurl.is_file())
Packit df99a1
        {
Packit df99a1
          djvuserver_file(pathurl, bundled, download);
Packit df99a1
        }
Packit df99a1
      else
Packit df99a1
        {
Packit df99a1
          GUTF8String id = pathurl.name();
Packit df99a1
          pathurl = pathurl.base();
Packit df99a1
          if (! pathurl.is_file())
Packit df99a1
            G_THROW("File not found");
Packit df99a1
          if (id != "index" && id != "index.djvu")
Packit df99a1
            djvuserver_component(pathurl, id);
Packit df99a1
          else if (bundled)
Packit df99a1
            djvuserver_file(pathurl, bundled, download);
Packit df99a1
          else
Packit df99a1
            djvuserver_directory(pathurl);
Packit df99a1
        }
Packit df99a1
    }
Packit df99a1
  G_CATCH(ex)
Packit df99a1
    {
Packit df99a1
      if (cgi)
Packit df99a1
        {
Packit df99a1
          GUTF8String cause = DjVuMessageLite::LookUpUTF8(ex.get_cause());
Packit df99a1
          fprintf(stdout,"Status: 400 %s\n", (const char*)cause);
Packit df99a1
          fprintf(stdout,"Content-Type: text/html\n\n");
Packit df99a1
          fprintf(stdout,
Packit df99a1
                  "\n"
Packit df99a1
                  "<HTML><HEAD><TITLE>400 Error</TITLE></HEAD><BODY>\n"
Packit df99a1
                  "

%s

The requested URL '%s' cannot be processed.

\n"

Packit df99a1
#ifdef DJVULIBRE_VERSION
Packit df99a1
                  "
<ADDRESS>djvuserve/DjVuLibre-" DJVULIBRE_VERSION "</ADDRESS>\n"
Packit df99a1
#endif
Packit df99a1
                  "</BODY></HTML>\n",
Packit df99a1
                  (const char *) cause,
Packit df99a1
                  (const char *) g().pathinfo );
Packit df99a1
        }
Packit df99a1
      else
Packit df99a1
        {
Packit df99a1
          ex.perror();
Packit df99a1
        }
Packit df99a1
      exit(10);
Packit df99a1
    }
Packit df99a1
  G_ENDCATCH;
Packit df99a1
  // return code zero
Packit df99a1
  return 0;
Packit df99a1
}