//======================================================================== // // pdfseparate.cc // // This file is licensed under the GPLv2 or later // // Copyright (C) 2011, 2012, 2015 Thomas Freitag // Copyright (C) 2012-2014, 2017, 2018 Albert Astals Cid // Copyright (C) 2013, 2016 Pino Toscano // Copyright (C) 2013 Daniel Kahn Gillmor // Copyright (C) 2013 Suzuki Toshiya // Copyright (C) 2017 LĂ©onard Michelet // Copyright (C) 2017 Adrian Johnson // Copyright (C) 2018 Adam Reichold // Copyright (C) 2019 Oliver Sander // //======================================================================== #include "config.h" #include #include #include #include #include #include "parseargs.h" #include "goo/GooString.h" #include "PDFDoc.h" #include "ErrorCodes.h" #include "GlobalParams.h" #include "Win32Console.h" #include static int firstPage = 0; static int lastPage = 0; static bool printVersion = false; static bool printHelp = false; static const ArgDesc argDesc[] = { {"-f", argInt, &firstPage, 0, "first page to extract"}, {"-l", argInt, &lastPage, 0, "last page to extract"}, {"-v", argFlag, &printVersion, 0, "print copyright and version info"}, {"-h", argFlag, &printHelp, 0, "print usage information"}, {"-help", argFlag, &printHelp, 0, "print usage information"}, {"--help", argFlag, &printHelp, 0, "print usage information"}, {"-?", argFlag, &printHelp, 0, "print usage information"}, {} }; static bool extractPages (const char *srcFileName, const char *destFileName) { char pathName[4096]; GooString *gfileName = new GooString (srcFileName); PDFDoc *doc = new PDFDoc (gfileName, nullptr, nullptr, nullptr); if (!doc->isOk()) { error(errSyntaxError, -1, "Could not extract page(s) from damaged file ('{0:s}')", srcFileName); delete doc; return false; } // destFileName can have multiple %% and one %d // We use auxDestFileName to replace all the valid % appearances // by 'A' (random char that is not %), if at the end of replacing // any of the valid appearances there is still any % around, the // pattern is wrong if (firstPage == 0 && lastPage == 0) { firstPage = 1; lastPage = doc->getNumPages(); } if (lastPage == 0) lastPage = doc->getNumPages(); if (firstPage == 0) firstPage = 1; if (lastPage < firstPage) { error(errCommandLine, -1, "Wrong page range given: the first page ({0:d}) can not be after the last page ({1:d}).", firstPage, lastPage); delete doc; return false; } bool foundmatch = false; char *auxDestFileName = strdup(destFileName); char *p = strstr(auxDestFileName, "%d"); if (p != nullptr) { foundmatch = true; *p = 'A'; } else { char pattern[6]; for (int i = 2; i < 10; i++) { sprintf(pattern, "%%0%dd", i); p = strstr(auxDestFileName, pattern); if (p != nullptr) { foundmatch = true; *p = 'A'; break; } } } if (!foundmatch && firstPage != lastPage) { error(errSyntaxError, -1, "'{0:s}' must contain '%d' (or any variant respecting printf format) if more than one page should be extracted, in order to print the page number", destFileName); free(auxDestFileName); delete doc; return false; } // at this point auxDestFileName can only contain %% p = strstr(auxDestFileName, "%%"); while (p != nullptr) { *p = 'A'; *(p + 1) = 'A'; p = strstr(p, "%%"); } // at this point any other % is wrong p = strstr(auxDestFileName, "%"); if (p != nullptr) { error(errSyntaxError, -1, "'{0:s}' can only contain one '%d' pattern", destFileName); free(auxDestFileName); delete doc; return false; } free(auxDestFileName); for (int pageNo = firstPage; pageNo <= lastPage; pageNo++) { snprintf (pathName, sizeof (pathName) - 1, destFileName, pageNo); GooString *gpageName = new GooString (pathName); PDFDoc *pagedoc = new PDFDoc (new GooString (srcFileName), nullptr, nullptr, nullptr); int errCode = pagedoc->savePageAs(gpageName, pageNo); if ( errCode != errNone) { delete gpageName; delete doc; delete pagedoc; return false; } delete pagedoc; delete gpageName; } delete doc; return true; } int main (int argc, char *argv[]) { bool ok; int exitCode; exitCode = 99; // parse args Win32Console win32console(&argc, &argv); ok = parseArgs (argDesc, &argc, argv); if (!ok || argc != 3 || printVersion || printHelp) { fprintf (stderr, "pdfseparate version %s\n", PACKAGE_VERSION); fprintf (stderr, "%s\n", popplerCopyright); fprintf (stderr, "%s\n", xpdfCopyright); if (!printVersion) { printUsage ("pdfseparate", " ", argDesc); } if (printVersion || printHelp) exitCode = 0; goto err0; } globalParams = std::make_unique(); ok = extractPages (argv[1], argv[2]); if (ok) { exitCode = 0; } err0: return exitCode; }