pdfimages.cc 6.68 KB
Newer Older
1 2 3 4 5 6 7 8 9 10
//========================================================================
//
// pdfimages.cc
//
// Copyright 1998-2003 Glyph & Cog, LLC
//
// Modified for Debian by Hamish Moffatt, 22 May 2002.
//
//========================================================================

11 12 13 14
//========================================================================
//
// Modified under the Poppler project - http://poppler.freedesktop.org
//
15 16 17
// All changes made under the Poppler project to this file are licensed
// under GPL version 2 or later
//
18
// Copyright (C) 2007-2008, 2010, 2018 Albert Astals Cid <aacid@kde.org>
Hib Eris's avatar
Hib Eris committed
19
// Copyright (C) 2010 Hib Eris <hib@hiberis.nl>
Jakob Voss's avatar
Jakob Voss committed
20
// Copyright (C) 2010 Jakob Voss <jakob.voss@gbv.de>
21
// Copyright (C) 2012, 2013, 2017 Adrian Johnson <ajohnson@redneon.com>
22
// Copyright (C) 2013 Suzuki Toshiya <mpsuzuki@hiroshima-u.ac.jp>
23
// Copyright (C) 2018 Adam Reichold <adam.reichold@t-online.de>
24 25 26 27 28 29
//
// To see a description of the changes please see the Changelog file that
// came with your tarball or type make ChangeLog if you are building from git
//
//========================================================================

30
#include "config.h"
31 32 33 34 35 36 37 38 39 40 41 42 43 44 45 46 47
#include <poppler-config.h>
#include <stdio.h>
#include <stdlib.h>
#include <stddef.h>
#include <string.h>
#include "parseargs.h"
#include "goo/GooString.h"
#include "goo/gmem.h"
#include "GlobalParams.h"
#include "Object.h"
#include "Stream.h"
#include "Array.h"
#include "Dict.h"
#include "XRef.h"
#include "Catalog.h"
#include "Page.h"
#include "PDFDoc.h"
Hib Eris's avatar
Hib Eris committed
48
#include "PDFDocFactory.h"
49 50
#include "ImageOutputDev.h"
#include "Error.h"
51
#include "Win32Console.h"
52 53 54

static int firstPage = 1;
static int lastPage = 0;
55
static GBool listImages = gFalse;
56 57
static GBool enablePNG = gFalse;
static GBool enableTiff = gFalse;
58
static GBool dumpJPEG = gFalse;
59
static GBool dumpJP2 = gFalse;
60
static GBool dumpJBIG2 = gFalse;
61
static GBool dumpCCITT = gFalse;
62
static GBool allFormats = gFalse;
Jakob Voss's avatar
Jakob Voss committed
63
static GBool pageNames = gFalse;
64 65 66 67 68 69
static char ownerPassword[33] = "\001";
static char userPassword[33] = "\001";
static GBool quiet = gFalse;
static GBool printVersion = gFalse;
static GBool printHelp = gFalse;

70
static const ArgDesc argDesc[] = {
71 72 73 74
  {"-f",      argInt,      &firstPage,     0,
   "first page to convert"},
  {"-l",      argInt,      &lastPage,      0,
   "last page to convert"},
75
#ifdef ENABLE_LIBPNG
76 77 78
  {"-png",      argFlag,     &enablePNG,      0,
   "change the default output format to PNG"},
#endif
79
#ifdef ENABLE_LIBTIFF
80 81 82
  {"-tiff",      argFlag,     &enableTiff,      0,
   "change the default output format to TIFF"},
#endif
83 84
  {"-j",      argFlag,     &dumpJPEG,      0,
   "write JPEG images as JPEG files"},
85 86
  {"-jp2",      argFlag,     &dumpJP2,      0,
   "write JPEG2000 images as JP2 files"},
87 88
  {"-jbig2",      argFlag,     &dumpJBIG2,      0,
   "write JBIG2 images as JBIG2 files"},
89 90
  {"-ccitt",      argFlag,     &dumpCCITT,      0,
   "write CCITT images as CCITT files"},
91
  {"-all",      argFlag,     &allFormats,    0,
92
   "equivalent to -png -tiff -j -jp2 -jbig2 -ccitt"},
93 94
  {"-list",   argFlag,     &listImages,      0,
   "print list of images instead of saving"},
95 96 97 98
  {"-opw",    argString,   ownerPassword,  sizeof(ownerPassword),
   "owner password (for encrypted files)"},
  {"-upw",    argString,   userPassword,   sizeof(userPassword),
   "user password (for encrypted files)"},
Jakob Voss's avatar
Jakob Voss committed
99 100
  {"-p",      argFlag,     &pageNames,     0,
   "include page numbers in output file names"},
101 102 103 104 105 106 107 108 109 110 111 112
  {"-q",      argFlag,     &quiet,         0,
   "don't print any messages or errors"},
  {"-v",      argFlag,     &printVersion,  0,
   "print copyright and version info"},
  {"-h",      argFlag,     &printHelp,     0,
   "print usage information"},
  {"-help",   argFlag,     &printHelp,     0,
   "print usage information"},
  {"--help",  argFlag,     &printHelp,     0,
   "print usage information"},
  {"-?",      argFlag,     &printHelp,     0,
   "print usage information"},
113
  {}
114 115 116 117 118
};

int main(int argc, char *argv[]) {
  PDFDoc *doc;
  GooString *fileName;
119
  char *imgRoot = nullptr;
120 121 122 123 124
  GooString *ownerPW, *userPW;
  ImageOutputDev *imgOut;
  GBool ok;
  int exitCode;

125
  Win32Console win32Console(&argc, &argv);
126 127 128 129
  exitCode = 99;

  // parse args
  ok = parseArgs(argDesc, &argc, argv);
130
  if (!ok || (listImages && argc != 2) || (!listImages && argc != 3) || printVersion || printHelp) {
131 132
    fprintf(stderr, "pdfimages version %s\n", PACKAGE_VERSION);
    fprintf(stderr, "%s\n", popplerCopyright);
133 134 135 136
    fprintf(stderr, "%s\n", xpdfCopyright);
    if (!printVersion) {
      printUsage("pdfimages", "<PDF-file> <image-root>", argDesc);
    }
137 138
    if (printVersion || printHelp)
      exitCode = 0;
139 140 141
    goto err0;
  }
  fileName = new GooString(argv[1]);
142 143
  if (!listImages)
    imgRoot = argv[2];
144 145

  // read config file
146
  globalParams = new GlobalParams();
147 148 149 150 151 152 153 154
  if (quiet) {
    globalParams->setErrQuiet(quiet);
  }

  // open PDF file
  if (ownerPassword[0] != '\001') {
    ownerPW = new GooString(ownerPassword);
  } else {
155
    ownerPW = nullptr;
156 157 158 159
  }
  if (userPassword[0] != '\001') {
    userPW = new GooString(userPassword);
  } else {
160
    userPW = nullptr;
161
  }
Hib Eris's avatar
Hib Eris committed
162 163 164 165 166
  if (fileName->cmp("-") == 0) {
      delete fileName;
      fileName = new GooString("fd://0");
  }

167
  doc = PDFDocFactory().createPDFDoc(*fileName, ownerPW, userPW);
Hib Eris's avatar
Hib Eris committed
168 169
  delete fileName;

170 171 172 173 174 175 176 177 178 179 180 181 182 183
  if (userPW) {
    delete userPW;
  }
  if (ownerPW) {
    delete ownerPW;
  }
  if (!doc->isOk()) {
    exitCode = 1;
    goto err1;
  }

  // check for copy permission
#ifdef ENFORCE_PERMISSIONS
  if (!doc->okToCopy()) {
184
    error(errNotAllowed, -1, "Copying of images from this document is not allowed.");
185 186 187 188 189 190 191 192 193 194
    exitCode = 3;
    goto err1;
  }
#endif

  // get page range
  if (firstPage < 1)
    firstPage = 1;
  if (lastPage < 1 || lastPage > doc->getNumPages())
    lastPage = doc->getNumPages();
195 196 197 198 199 200
  if (lastPage < firstPage) {
    error(errCommandLine, -1,
          "Wrong page range given: the first page ({0:d}) can not be after the last page ({1:d}).",
          firstPage, lastPage);
    goto err1;
  }
201 202

  // write image files
203
  imgOut = new ImageOutputDev(imgRoot, pageNames, listImages);
204
  if (imgOut->isOk()) {
205 206
    if (allFormats) {
      imgOut->enablePNG(gTrue);
207
      imgOut->enableTiff(gTrue);
208 209 210 211 212 213 214 215 216 217 218 219
      imgOut->enableJpeg(gTrue);
      imgOut->enableJpeg2000(gTrue);
      imgOut->enableJBig2(gTrue);
      imgOut->enableCCITT(gTrue);
    } else {
      imgOut->enablePNG(enablePNG);
      imgOut->enableTiff(enableTiff);
      imgOut->enableJpeg(dumpJPEG);
      imgOut->enableJpeg2000(dumpJP2);
      imgOut->enableJBig2(dumpJBIG2);
      imgOut->enableCCITT(dumpCCITT);
    }
220 221
    doc->displayPages(imgOut, firstPage, lastPage, 72, 72, 0,
                      gTrue, gFalse, gFalse);
222 223 224 225 226 227 228 229 230 231 232 233 234
  }
  delete imgOut;

  exitCode = 0;

  // clean up
 err1:
  delete doc;
  delete globalParams;
 err0:

  return exitCode;
}