blob: 168848100f074423e8d403061f7cb487f5330dc6 [file] [log] [blame]
//========================================================================
//
// pdftohtml.cc
//
//
// Copyright 1999-2000 G. Ovtcharov
//========================================================================
#include "config.h"
#include <poppler-config.h>
#include <stdio.h>
#include <stdlib.h>
#include <stddef.h>
#include <string.h>
#include <dirent.h>
#include <time.h>
#include "parseargs.h"
#include "goo/GooString.h"
#include "goo/gmem.h"
#include "Object.h"
#include "Stream.h"
#include "Array.h"
#include "Dict.h"
#include "XRef.h"
#include "Catalog.h"
#include "Page.h"
#include "PDFDoc.h"
#include "ABWOutputDev.h"
#include "PSOutputDev.h"
#include "GlobalParams.h"
#include "Error.h"
#include "goo/gfile.h"
#include <libxml/parser.h>
#include <libxml/tree.h>
static int firstPage = 1;
static int lastPage = 0;
static GBool printHelp = gFalse;
GBool stout = gFalse;
static char ownerPassword[33] = "";
static char userPassword[33] = "";
static char textEncName[128] = "";
static ArgDesc argDesc[] = {
{"-f", argInt, &firstPage, 0,
"first page to convert"},
{"-l", argInt, &lastPage, 0,
"last page to convert"},
{"-h", argFlag, &printHelp, 0,
"print usage information"},
{"--help", argFlag, &printHelp, 0,
"print usage information"},
{"--stdout" ,argFlag, &stout, 0,
"use standard output"},
{"--opw", argString, ownerPassword, sizeof(ownerPassword),
"owner password (for encrypted files)"},
{"--upw", argString, userPassword, sizeof(userPassword),
"user password (for encrypted files)"},
{NULL}
};
int main(int argc, char *argv[]) {
PDFDoc *doc = NULL;
GooString *fileName = NULL;
GooString *abwFileName = NULL;
ABWOutputDev *abwOut = NULL;
GBool ok;
GooString *ownerPW, *userPW;
Object info;
int result = 1;
char * outpName;
xmlDocPtr XMLdoc = NULL;
// parse args
parseArgs(argDesc, &argc, argv);
globalParams = new GlobalParams();
fileName = new GooString(argv[1]);
if (stout || (argc < 2)){
outpName = "-";
}
else {
outpName = argv[2];
}
if (ownerPassword[0]) {
ownerPW = new GooString(ownerPassword);
} else {
ownerPW = NULL;
}
if (userPassword[0]) {
userPW = new GooString(userPassword);
} else {
userPW = NULL;
}
doc = new PDFDoc(fileName, ownerPW, userPW);
if (userPW) {
delete userPW;
}
if (ownerPW) {
delete ownerPW;
}
if (!doc || !doc->isOk())
{
fprintf (stderr, "Error opening PDF %s\n", fileName->getCString());
goto error;
}
// check for copy permission
if (!doc->okToCopy()) {
fprintf(stderr, "Copying of text from this document is not allowed.\n");
goto error;
}
XMLdoc = xmlNewDoc(BAD_CAST "1.0");
abwOut = new ABWOutputDev(XMLdoc);
abwOut->setPDFDoc(doc);
if (lastPage == 0 || lastPage > doc->getNumPages ()) lastPage = doc->getNumPages();
if (firstPage < 1) firstPage = 1;
if (abwOut->isOk())
{
doc->displayPages(abwOut, firstPage, lastPage, 72, 72, 0, gTrue, gFalse, gFalse);
abwOut->createABW();
}
if (xmlSaveFormatFileEnc(outpName, XMLdoc, "UTF-8", 1) == -1)
{
fprintf (stderr, "Error saving to %s\n", outpName);
goto error;
}
result = 0;
error:
// clean up
if(globalParams) delete globalParams;
if(doc) delete doc;
if(XMLdoc) xmlFreeDoc(XMLdoc);
if(abwOut) delete abwOut;
// check for memory leaks
Object::memCheck(stderr);
gMemReport(stderr);
return result;
}