/* * ps.c -- Postscript scanning and copying routines. * Copyright (C) 1992 Timothy O. Theisen * Copyright (C) 2004 Jose E. Marchesi * * This program is free software; you can redistribute it and/or modify * it under the terms of the GNU General Public License as published by * the Free Software Foundation; either version 2 of the License, or * (at your option) any later version. * * This program is distributed in the hope that it will be useful, * but WITHOUT ANY WARRANTY; without even the implied warranty of * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the * GNU General Public License for more details. * * You should have received a copy of the GNU General Public License * along with GNU gv; see the file COPYING. If not, write to * the Free Software Foundation, Inc., 51 Franklin Street, Fifth Floor, * Boston, MA 02110-1301, USA * * Author: Tim Theisen Systems Programmer * Internet: tim@cs.wisc.edu Department of Computer Sciences * UUCP: uwvax!tim University of Wisconsin-Madison * Phone: (608)262-0438 1210 West Dayton Street * FAX: (608)262-9777 Madison, WI 53706 * * Changes submitted by Maurizio Loreti distributed on the public * domain: * * - Code for handle bzip2 compressed files. */ /* * Added the ps_io_*() routines, rewrote readline(), modified * pscopyuntil() and pscopydoc() and eliminated pscopy(). * The modifications mainly aim at * - elimination of the (line length <= 255) constraint since * there are just too many documents ignoring this requirement. * - acceptance of '\r' as line terminator as suggested by * Martin Buck (martin-2.buck@student.uni-ulm.de). * Johannes Plass, 04/96 (plass@thep.physik.uni-mainz.de) * */ /* * > Believe it or not--even Adobe doesn't know how to produce correct * > PS-files. Their Acrobat Reader sometimes starts including other files * > with %%BeginFile instead of %%BeginFile: and even more often ends them * > with just %%EOF instead of %%EndFile. * > Martin Buck, martin-2.buck@student.uni-ulm.de * * Therefore we use Martin's ACROREAD_WORKAROUND (thanks for the patch, Martin). * ###jp### 04/96 * */ /* modified by Russell Lang, rjl@aladdin.com to use with GSview * 1995-01-11 * supports DOS EPS files (binary header) */ #define USE_ACROREAD_WORKAROUND #include #include #ifndef SEEK_SET #define SEEK_SET 0 #endif #ifndef BUFSIZ #define BUFSIZ 1024 #endif #include #include "spectre-utils.h" #include "ps.h" #ifdef BSD4_2 #define memset(a,b,c) bzero(a,c) #endif #define BEGINMESSAGE(txt) #define ENDMESSAGE(txt) #define INFMESSAGE(txt) #define IMESSAGE(it) #define INFIMESSAGE(txt,it) #define FMESSAGE(ft) #define INFFMESSAGE(txt,ft) #define SMESSAGE(st) #define INFSMESSAGE(txt,st) #define IIMESSAGE(it1,it2) #define INFIIMESSAGE(txt,it1,it2) #define PS_malloc(sss) malloc ((size_t)(sss) ) #define PS_calloc(ccc,sss) calloc ((size_t)(ccc),(size_t)(sss) ) #define PS_realloc(ppp,sss) realloc ((void*) (ppp),(size_t)(sss) ) #define PS_free(ppp) free ((void*) (ppp) ) #define PS_cfree(ppp) cfree ((void*) (ppp) ) #define PS_XtMalloc(sss) malloc ((size_t)(sss) ) #define PS_XtRealloc(ppp,sss) realloc ((void*) (ppp),(size_t)(sss) ) #define PS_XtFree(ppp) free ((void*) (ppp) ) /* We use this helper function for providing proper */ /* case and colon :-) insensitive DSC matching */ static int dsc_strncmp(char *s1, char *s2, size_t n) { char *tmp; if (_spectre_strncasecmp(s1, s2, n) == 0) return 0; if (s2[n-1] == ':'){ tmp = (char *) PS_malloc(n*sizeof(char)); strncpy(tmp, s2, (n-1)); tmp[n-1]=' '; if (_spectre_strncasecmp(s1, tmp, n) == 0){ PS_free(tmp); return 0; } PS_free(tmp); } return 1; } /* length calculates string length at compile time */ /* can only be used with character constants */ #define length(a) (sizeof((a))-1) #define iscomment(a, b) (dsc_strncmp((a), (b), length((b))) == 0) #define DSCcomment(a) ((a)[0] == '%' && (a)[1] == '%') /* list of standard paper sizes from Adobe's PPD. */ static const struct documentmedia papersizes[] = { {"BBox", 0, 0}, {"Letter", 612, 792}, {"LetterSmall", 612, 792}, {"Legal", 612, 1008}, {"Statement", 396, 612}, {"Tabloid", 792, 1224}, {"Ledger", 1224, 792}, {"Executive", 540, 720}, {"A0", 2384, 3370}, {"A1", 1684, 2384}, {"A2", 1191, 1684}, {"A3", 842, 1191}, {"A4", 595, 842}, {"A4Small", 595, 842}, {"A5", 420, 595}, {"B4", 729, 1032}, {"B5", 516, 729}, {"Folio", 612, 936}, {"Quarto", 610, 780}, {"10x14", 720, 1008}, { NULL, 0, 0} }; #if NeedFunctionPrototypes # define PT(aaa) aaa #else # define PT(aaa) () #endif typedef enum { False = 0, True } Boolean; /*--------------------------------------------------*/ /* Declarations for ps_io_*() routines. */ typedef struct FileDataStruct_ *FileData; typedef struct FileDataStruct_ { FILE *file; /* file */ int filepos; /* file position corresponding to the start of the line */ char *buf; /* buffer */ int buf_size; /* size of buffer */ int buf_end; /* last char in buffer given as offset to buf */ int line_begin; /* start of the line given as offset to buf */ int line_end; /* end of the line given as offset to buf */ int line_len; /* length of line, i.e. (line_end-line_begin) */ char line_termchar; /* char exchanged for a '\0' at end of line */ int status; /* 0 = okay, 1 = failed */ } FileDataStruct; static FileData ps_io_init PT((FILE *)); static void ps_io_exit PT((FileData)); static void ps_io_rewind PT((FileData)); static char *ps_io_fgetchars PT((FileData, int)); static int ps_io_fseek PT((FileData, int)); static int ps_io_ftell PT((FileData)); static char *readline PT((FileData, long, char **, long *, unsigned int *)); static char *readlineuntil PT((FileData, long, char **, long *, unsigned int *, char)); static char *gettextline PT((char *)); static char *ps_gettext PT((char *,char **)); static int blank PT((char *)); static char *pscopyuntil PT((FileData,FILE *,long,long,char *)); /* DOS EPS header reading */ static unsigned long ps_read_doseps PT((FileData, DOSEPS *)); static PS_DWORD reorder_dword PT((PS_DWORD)); static PS_WORD reorder_word PT((PS_WORD)); static char *skipped_line = "% ps_io_fgetchars: skipped line"; static char *empty_string = ""; static Boolean scan_boundingbox(int *bb, const char *line) { char fllx[21], flly[21], furx[21], fury[21]; if (sscanf (line, "%d %d %d %d", &bb[LLX], &bb[LLY], &bb[URX], &bb[URY]) == 4) return True; if (sscanf (line, "%20s %20s %20s %20s", fllx, flly, furx, fury) == 4) { float ffllx, fflly, ffurx, ffury; ffllx = _spectre_strtod (fllx, NULL); fflly = _spectre_strtod (flly, NULL); ffurx = _spectre_strtod (furx, NULL); ffury = _spectre_strtod (fury, NULL); bb[LLX] = ffllx; bb[LLY] = fflly; bb[URX] = ffurx; bb[URY] = ffury; if (bb[LLX] > ffllx) bb[LLX]--; if (bb[LLY] > fflly) bb[LLY]--; if (bb[URX] < ffurx) bb[URX]++; if (bb[URY] < ffury) bb[URY]++; return True; } return False; } /*--------------------------------------------------*/ /* * psscan -- scan the PostScript file for document structuring comments. * * This scanner is designed to retrieve the information necessary for * the ghostview previewer. It will scan files that conform to any * version (1.0, 2.0, 2.1, or 3.0) of the document structuring conventions. * It does not really care which version of comments the file contains. * (The comments are largely upward compatible.) It will scan a number * of non-conforming documents. (You could have part of the document * conform to V2.0 and the rest conform to V3.0. It would be similar * to the DC-2 1/2+, it would look funny but it can still fly.) * * This routine returns a pointer to the document structure. * The structure contains the information relevant to previewing. * These include EPSF flag (to tell if the file is a encapsulated figure), * Page Media (for the Page Size), Bounding Box (to minimize backing * pixmap size or determine window size for encapsulated PostScript), * Orientation of Paper (for default transformation matrix), and * Page Order. The title and CreationDate are also retrieved to * help identify the document. * * The following comments are examined: * * Header section: * Must start with %!PS-Adobe-. Version numbers ignored. * * %!PS-Adobe-* [EPSF*] (changed EPSF-* to EPSF* to do XFig a favor ...###jp###) * %%BoundingBox: |(atend) * %%CreationDate: * %%Creator: * %%Orientation: Portrait|Landscape|(atend) * %%Pages: []|(atend) * %%PageOrder: Ascend|Descend|Special|(atend) * %%Title: * %%DocumentMedia: * %%DocumentPaperSizes: * %%EndComments * * Note: Either the 3.0 or 2.0 syntax for %%Pages is accepted. * Also either the 2.0 %%DocumentPaperSizes or the 3.0 * %%DocumentMedia comments are accepted as well. * * The header section ends either explicitly with %%EndComments or * implicitly with any line that does not begin with %X where X is * a not whitespace character. * * If the file is encapsulated PostScript the optional Preview section * is next: * * %%BeginPreview * %%EndPreview * * This section explicitly begins and ends with the above comments. * * Next the Defaults section for version 3 page defaults: * * %%BeginDefaults * %%PageBoundingBox: * %%PageOrientation: Portrait|Landscape * %%PageMedia: * %%EndDefaults * * This section explicitly begins and ends with the above comments. * * The prolog section either explicitly starts with %%BeginProlog or * implicitly with any nonblank line. * * %%BeginProlog * %%EndProlog * * The Prolog should end with %%EndProlog, however the proglog implicitly * ends when %%BeginSetup, %%Page, %%Trailer or %%EOF are encountered. * * The Setup section is where the version 2 page defaults are found. * This section either explicitly begins with %%BeginSetup or implicitly * with any nonblank line after the Prolog. * * %%BeginSetup * %%PageBoundingBox: * %%PageOrientation: Portrait|Landscape * %%PaperSize: * %%EndSetup * * The Setup should end with %%EndSetup, however the setup implicitly * ends when %%Page, %%Trailer or %%EOF are encountered. * * Next each page starts explicitly with %%Page and ends implicitly with * %%Page or %%Trailer or %%EOF. The following comments are recognized: * * %%Page: * %%PageBoundingBox: |(atend) * %%PageOrientation: Portrait|Landscape * %%PageMedia: * %%PaperSize: * * The trailer section start explicitly with %%Trailer and end with %%EOF. * The following comment are examined with the proper (atend) notation * was used in the header: * * %%Trailer * %%BoundingBox: |(atend) * %%Orientation: Portrait|Landscape|(atend) * %%Pages: []|(atend) * %%PageOrder: Ascend|Descend|Special|(atend) * %%EOF * * * + A DC-3 received severe damage to one of its wings. The wing was a total * loss. There was no replacement readily available, so the mechanic * installed a wing from a DC-2. */ /*-----------------------------------------------------------*/ #define CHECK_MALLOCED(aaa) /*###########################################################*/ /* psscan */ /*###########################################################*/ struct document * psscan(const char *filename, int scanstyle) { struct document *doc; FILE *file; int bb_set = NONE; int pages_set = NONE; int page_order_set = NONE; int orientation_set = NONE; int page_bb_set = NONE; int page_media_set = NONE; int preread; /* flag which tells the readline isn't needed */ unsigned int i; unsigned int maxpages = 0; unsigned int nextpage = 1; /* Next expected page */ unsigned int thispage; int ignore = 0; /* whether to ignore page ordinals */ char *label; char *line; /* 255 characters + 1 newline + 1 NULL */ char text[PSLINELENGTH]; /* Temporary storage for text */ long position; /* Position of the current line */ long beginsection; /* Position of the beginning of the section */ unsigned int line_len; /* Length of the current line */ unsigned int section_len = 0; /* Place to accumulate the section length */ char *next_char; /* 1st char after text returned by ps_gettext() */ char *cp; ConstMedia dmp; long enddoseps; /* zero of not DOS EPS, otherwise position of end of ps section */ DOSEPS doseps; FileData fd; int respect_eof; /* Derived from the scanstyle argument. If set to 0 EOF comments will be ignored, if set to 1 they will be taken seriously. Purpose; Out there are many documents which include other DSC conforming documents without without enclosing them by 'BeginDocument' and 'EndDocument' comments. This may cause fake EOF comments to appear in the body of a page. Similarly, if respect_eof is set to false 'Trailer' comments are ignored except of the last one found in the document. */ int ignore_dsc; /* Derived from scanstyle. If set the document structure will be ignored. */ BEGINMESSAGE(psscan) respect_eof = (scanstyle & SCANSTYLE_IGNORE_EOF) ? 0 : 1; ignore_dsc = (scanstyle & SCANSTYLE_IGNORE_DSC) ? 1 : 0; if (ignore_dsc) { INFMESSAGE(ignoring DSC) ENDMESSAGE(psscan) return(NULL); } file = fopen (filename, "rb"); if (!file) { return NULL; } fd = ps_io_init(file); /* rjl: check for DOS EPS files and almost DSC files that start with ^D */ enddoseps = ps_read_doseps (fd, &doseps); if (!readline(fd, enddoseps, &line, &position, &line_len)) { fprintf(stderr, "Warning: empty file.\n"); ENDMESSAGE(psscan) ps_io_exit(fd); fclose (file); return(NULL); } /* HP printer job language data follows. Some printer drivers add pjl * commands to switch a pjl printer to postscript mode. If no PS header * follows, this seems to be a real pjl file. */ if(iscomment(line, "\033%-12345X@PJL")) { /* read until first DSC comment */ readlineuntil(fd, enddoseps, &line, &position, &line_len, '%'); if(line[0] != '%') { fprintf(stderr, "psscan error: input files seems to be a PJL file.\n"); ENDMESSAGE(psscan) ps_io_exit(fd); fclose (file); return (NULL); } } /* Header comments */ /* Header should start with "%!PS-Adobe-", but some programms omit * parts of this or add a ^D at the beginning. */ if ((iscomment(line,"%!PS") || iscomment(line, "\004%!PS"))) { INFMESSAGE(found "PS-Adobe-" comment) doc = (struct document *) PS_calloc(1, sizeof(struct document)); CHECK_MALLOCED(doc); /* ignore possible leading ^D */ if (*line == '\004') { position++; line_len--; } doc->ref_count = 1; doc->filename = _spectre_strdup (filename); doc->beginheader = position; section_len = line_len; text[0] = '\0'; sscanf(line, "%%!%256s %*s", text); doc->format = _spectre_strdup (text); text[0] = '\0'; sscanf(line, "%*s %256s", text); doc->epsf = iscomment(text, "EPSF"); } else { /* There are postscript documents that do not have %PS at the beginning, usually unstructured. We should GS decide For instance, the tech reports at this university: http://svrc.it.uq.edu.au/Bibliography/svrc-tr.html?94-45 add ugly PostScript before the actual document. GS and gv is able to display them correctly as unstructured PS. In a way, this makes sense, a program PostScript does not need the !PS at the beginning. */ doc = (struct document *) PS_calloc(1, sizeof(struct document)); CHECK_MALLOCED(doc); doc->ref_count = 1; doc->filename = _spectre_strdup (filename); doc->default_page_orientation = NONE; doc->orientation = NONE; } if (enddoseps) { /* rjl: add doseps header */ doc->doseps = (DOSEPS *) malloc(sizeof(DOSEPS)); *(doc->doseps) = doseps; } preread = 0; while (preread || readline(fd, enddoseps, &line, &position, &line_len)) { if (!preread) section_len += line_len; preread = 0; if (line[0] != '%' || iscomment(line+1, "%EndComments") || line[1] == ' ' || line[1] == '\t' || line[1] == '\n' || !isprint(line[1])) { break; } else if (line[1] != '%') { /* Do nothing */ } else if (doc->title == NULL && iscomment(line+2, "Title:")) { doc->title = gettextline(line+length("%%Title:")); } else if (doc->date == NULL && iscomment(line+2, "CreationDate:")) { doc->date = gettextline(line+length("%%CreationDate:")); } else if (doc->languagelevel == NULL && iscomment(line+2, "LanguageLevel:")) { doc->languagelevel = gettextline(line+length("%%LanguageLevel:")); } else if(doc->creator == NULL && iscomment(line + 2, "Creator:")) { doc->creator = gettextline(line + length("%%Creator:")); } else if(doc->fortext == NULL && iscomment(line + 2, "For:")) { doc->fortext = gettextline(line + length("%%For:")); } else if (bb_set == NONE && iscomment(line+2, "BoundingBox:")) { sscanf(line+length("%%BoundingBox:"), "%256s", text); if (strcmp(text, "(atend)") == 0) { bb_set = ATEND; } else { if (scan_boundingbox(doc->boundingbox, line + length("%%BoundingBox:"))) bb_set = 1; } } else if (orientation_set == NONE && iscomment(line+2, "Orientation:")) { sscanf(line+length("%%Orientation:"), "%256s", text); if (strcmp(text, "(atend)") == 0 || strcmp(text, "atend") == 0) { orientation_set = ATEND; } else if (strcmp(text, "Portrait") == 0) { doc->orientation = PORTRAIT; orientation_set = 1; } else if (strcmp(text, "Landscape") == 0) { doc->orientation = LANDSCAPE; orientation_set = 1; } else if (strcmp(text, "Seascape") == 0) { doc->orientation = SEASCAPE; orientation_set = 1; } else if (strcmp(text, "UpsideDown") == 0) { doc->orientation = UPSIDEDOWN; orientation_set = 1; } } else if (page_order_set == NONE && iscomment(line+2, "PageOrder:")) { sscanf(line+length("%%PageOrder:"), "%256s", text); if (strcmp(text, "(atend)") == 0 || strcmp(text, "atend") == 0) { page_order_set = ATEND; } else if (strcmp(text, "Ascend") == 0) { doc->pageorder = ASCEND; page_order_set = 1; } else if (strcmp(text, "Descend") == 0) { doc->pageorder = DESCEND; page_order_set = 1; } else if (strcmp(text, "Special") == 0) { doc->pageorder = SPECIAL; page_order_set = 1; } } else if (pages_set == NONE && iscomment(line+2, "Pages:")) { sscanf(line+length("%%Pages:"), "%256s", text); if (strcmp(text, "(atend)") == 0 || strcmp(text, "atend") == 0) { pages_set = ATEND; } else { int page_order; switch (sscanf(line+length("%%Pages:"), "%d %d", &maxpages, &page_order)) { case 2: if (page_order_set == NONE) { if (page_order == -1) { doc->pageorder = DESCEND; page_order_set = 1; } else if (page_order == 0) { doc->pageorder = SPECIAL; page_order_set = 1; } else if (page_order == 1) { doc->pageorder = ASCEND; page_order_set = 1; } } case 1: if (maxpages > 0) { doc->pages = (struct page *) PS_calloc(maxpages, sizeof(struct page)); CHECK_MALLOCED(doc->pages); } } } } else if (doc->nummedia == NONE && iscomment(line+2, "DocumentMedia:")) { char w[21], h[21]; doc->media = (Media) PS_calloc(1, sizeof (MediaStruct)); CHECK_MALLOCED(doc->media); doc->media[0].name = ps_gettext(line+length("%%DocumentMedia:"), &next_char); if (doc->media[0].name != NULL) { if (sscanf(next_char, "%20s %20s", w, h) == 2) { doc->media[0].width = _spectre_strtod (w, NULL) + 0.5; doc->media[0].height = _spectre_strtod (h, NULL) + 0.5; } if (doc->media[0].width != 0 && doc->media[0].height != 0) { doc->nummedia = 1; } else { PS_free(doc->media[0].name); doc->media[0].name = NULL; } } preread=1; while (readline(fd, enddoseps, &line, &position, &line_len) && DSCcomment(line) && iscomment(line+2, "+")) { section_len += line_len; doc->media = (Media) PS_realloc(doc->media, (doc->nummedia+1)* sizeof (MediaStruct)); CHECK_MALLOCED(doc->media); memset (doc->media + doc->nummedia, 0, sizeof (MediaStruct)); doc->media[doc->nummedia].name = ps_gettext(line+length("%%+"), &next_char); if (doc->media[doc->nummedia].name != NULL) { if (sscanf(next_char, "%20s %20s", w, h) == 2) { doc->media[doc->nummedia].width = _spectre_strtod (w, NULL) + 0.5; doc->media[doc->nummedia].height = _spectre_strtod (h, NULL) + 0.5; } if (doc->media[doc->nummedia].width != 0 && doc->media[doc->nummedia].height != 0) { doc->nummedia++; } else { PS_free(doc->media[doc->nummedia].name); doc->media[doc->nummedia].name = NULL; } } } section_len += line_len; if (doc->nummedia != 0) doc->default_page_media = doc->media; } else if (doc->nummedia == NONE && iscomment(line+2, "DocumentPaperSizes:")) { doc->media = (Media) PS_calloc(1, sizeof (MediaStruct)); CHECK_MALLOCED(doc->media); doc->media[0].name = ps_gettext(line+length("%%DocumentPaperSizes:"), &next_char); if (doc->media[0].name != NULL) { for (i=0; papersizes[i].name; i++) { dmp = (Media)&papersizes[i]; /* Note: Paper size comment uses down cased paper size * name. Case insensitive compares are only used for * PaperSize comments. */ if (_spectre_strcasecmp(doc->media[0].name, dmp->name) == 0) { PS_free(doc->media[0].name); doc->media[0].name = (char *)PS_malloc(strlen(dmp->name)+1); CHECK_MALLOCED(doc->media[0].name); strcpy(doc->media[0].name, dmp->name); doc->media[0].width = dmp->width; doc->media[0].height = dmp->height; break; } } if (doc->media[0].width != 0 && doc->media[0].height != 0) { doc->nummedia = 1; } else { PS_free(doc->media[0].name); doc->media[0].name = NULL; } } while ((cp = ps_gettext(next_char, &next_char))) { doc->media = (Media) PS_realloc(doc->media, (doc->nummedia+1)* sizeof (MediaStruct)); CHECK_MALLOCED(doc->media); memset (doc->media + doc->nummedia, 0, sizeof (MediaStruct)); doc->media[doc->nummedia].name = cp; for (i=0; papersizes[i].name; i++) { dmp = (Media)&papersizes[i]; /* Note: Paper size comment uses down cased paper size * name. Case insensitive compares are only used for * PaperSize comments. */ if (_spectre_strcasecmp(doc->media[doc->nummedia].name, dmp->name) == 0) { PS_free(doc->media[doc->nummedia].name); doc->media[doc->nummedia].name = (char *)PS_malloc(strlen(dmp->name)+1); CHECK_MALLOCED(doc->media[doc->nummedia].name); strcpy(doc->media[doc->nummedia].name, dmp->name); doc->media[doc->nummedia].width = dmp->width; doc->media[doc->nummedia].height = dmp->height; break; } } if (doc->media[doc->nummedia].width != 0 && doc->media[doc->nummedia].height != 0) { doc->nummedia++; } else { PS_free(doc->media[doc->nummedia].name); doc->media[doc->nummedia].name = NULL; } } preread=1; while (readline(fd, enddoseps, &line, &position, &line_len) && DSCcomment(line) && iscomment(line+2, "+")) { section_len += line_len; next_char = line + length("%%+"); while ((cp = ps_gettext(next_char, &next_char))) { doc->media = (Media) PS_realloc(doc->media, (doc->nummedia+1)* sizeof (MediaStruct)); CHECK_MALLOCED(doc->media); memset (doc->media + doc->nummedia, 0, sizeof (MediaStruct)); doc->media[doc->nummedia].name = cp; for (i=0; papersizes[i].name; i++) { dmp = (Media)&papersizes[i]; /* Note: Paper size comment uses down cased paper size * name. Case insensitive compares are only used for * PaperSize comments. */ if (_spectre_strcasecmp(doc->media[doc->nummedia].name, dmp->name) == 0) { doc->media[doc->nummedia].width = dmp->width; doc->media[doc->nummedia].height = dmp->height; break; } } if (doc->media[doc->nummedia].width != 0 && doc->media[doc->nummedia].height != 0) { doc->nummedia++; } else { PS_free(doc->media[doc->nummedia].name); doc->media[doc->nummedia].name = NULL; } } } section_len += line_len; if (doc->nummedia != 0) doc->default_page_media = doc->media; } } if (DSCcomment(line) && iscomment(line+2, "EndComments")) { readline(fd, enddoseps, &line, &position, &line_len); section_len += line_len; } doc->endheader = position; doc->lenheader = section_len - line_len; /* Optional Preview comments for encapsulated PostScript files */ beginsection = position; section_len = line_len; while (blank(line) && readline(fd, enddoseps, &line, &position, &line_len)) { section_len += line_len; } if (doc->epsf && DSCcomment(line) && iscomment(line+2, "BeginPreview")) { doc->beginpreview = beginsection; beginsection = 0; while (readline(fd, enddoseps, &line, &position, &line_len) && !(DSCcomment(line) && iscomment(line+2, "EndPreview"))) { section_len += line_len; } section_len += line_len; readline(fd, enddoseps, &line, &position, &line_len); section_len += line_len; doc->endpreview = position; doc->lenpreview = section_len - line_len; } /* Page Defaults for Version 3.0 files */ if (beginsection == 0) { beginsection = position; section_len = line_len; } while (blank(line) && readline(fd, enddoseps, &line, &position, &line_len)) { section_len += line_len; } if (DSCcomment(line) && iscomment(line+2, "BeginDefaults")) { doc->begindefaults = beginsection; beginsection = 0; while (readline(fd, enddoseps, &line, &position, &line_len) && !(DSCcomment(line) && iscomment(line+2, "EndDefaults"))) { section_len += line_len; if (!DSCcomment(line)) { /* Do nothing */ } else if (doc->default_page_orientation == NONE && iscomment(line+2, "PageOrientation:")) { sscanf(line+length("%%PageOrientation:"), "%256s", text); if (strcmp(text, "Portrait") == 0) { doc->default_page_orientation = PORTRAIT; } else if (strcmp(text, "Landscape") == 0) { doc->default_page_orientation = LANDSCAPE; } else if (strcmp(text, "Seascape") == 0) { doc->default_page_orientation = SEASCAPE; } else if (strcmp(text, "UpsideDown") == 0) { doc->default_page_orientation = UPSIDEDOWN; } } else if (page_media_set == NONE && iscomment(line+2, "PageMedia:")) { cp = ps_gettext(line+length("%%PageMedia:"), NULL); for (dmp = doc->media, i=0; inummedia; i++, dmp++) { if (strcmp(cp, dmp->name) == 0) { doc->default_page_media = dmp; page_media_set = 1; break; } } PS_free(cp); } else if (page_bb_set == NONE && iscomment(line+2, "PageBoundingBox:")) { if (scan_boundingbox(doc->default_page_boundingbox, line+length("%%PageBoundingBox:"))) page_bb_set = 1; } } section_len += line_len; readline(fd, enddoseps, &line, &position, &line_len); section_len += line_len; doc->enddefaults = position; doc->lendefaults = section_len - line_len; } /* Document Prolog */ if (beginsection == 0) { beginsection = position; section_len = line_len; } while (blank(line) && readline(fd, enddoseps, &line, &position, &line_len)) { section_len += line_len; } if (!(DSCcomment(line) && (iscomment(line+2, "BeginSetup") || iscomment(line+2, "Page:") || iscomment(line+2, "Trailer") || iscomment(line+2, "EOF")))) { doc->beginprolog = beginsection; beginsection = 0; preread = 1; while ((preread || readline(fd, enddoseps, &line, &position, &line_len)) && !(DSCcomment(line) && (iscomment(line+2, "EndProlog") || iscomment(line+2, "BeginSetup") || iscomment(line+2, "Page:") || iscomment(line+2, "Trailer") || iscomment(line+2, "EOF")))) { if (!preread) section_len += line_len; preread = 0; } section_len += line_len; if (DSCcomment(line) && iscomment(line+2, "EndProlog")) { readline(fd, enddoseps, &line, &position, &line_len); section_len += line_len; } doc->endprolog = position; doc->lenprolog = section_len - line_len; } /* Document Setup, Page Defaults found here for Version 2 files */ if (beginsection == 0) { beginsection = position; section_len = line_len; } while (blank(line) && readline(fd, enddoseps, &line, &position, &line_len)) { section_len += line_len; } if (!(DSCcomment(line) && (iscomment(line+2, "Page:") || iscomment(line+2, "Trailer") || (respect_eof && iscomment(line+2, "EOF"))))) { doc->beginsetup = beginsection; beginsection = 0; preread = 1; while ((preread || readline(fd, enddoseps, &line, &position, &line_len)) && !(DSCcomment(line) && (iscomment(line+2, "EndSetup") || iscomment(line+2, "Page:") || iscomment(line+2, "Trailer") || (respect_eof && iscomment(line+2, "EOF"))))) { if (!preread) section_len += line_len; preread = 0; if (!DSCcomment(line)) { /* Do nothing */ } else if (doc->default_page_orientation == NONE && iscomment(line+2, "PageOrientation:")) { sscanf(line+length("%%PageOrientation:"), "%256s", text); if (strcmp(text, "Portrait") == 0) { doc->default_page_orientation = PORTRAIT; } else if (strcmp(text, "Landscape") == 0) { doc->default_page_orientation = LANDSCAPE; } else if (strcmp(text, "Seascape") == 0) { doc->default_page_orientation = SEASCAPE; } else if (strcmp(text, "UpsideDown") == 0) { doc->default_page_orientation = UPSIDEDOWN; } } else if (page_media_set == NONE && iscomment(line+2, "PaperSize:")) { cp = ps_gettext(line+length("%%PaperSize:"), NULL); for (dmp = doc->media, i=0; inummedia; i++, dmp++) { /* Note: Paper size comment uses down cased paper size * name. Case insensitive compares are only used for * PaperSize comments. */ if (_spectre_strcasecmp(cp, dmp->name) == 0) { doc->default_page_media = dmp; page_media_set = 1; break; } } PS_free(cp); } else if (page_bb_set == NONE && iscomment(line+2, "PageBoundingBox:")) { if (scan_boundingbox(doc->default_page_boundingbox, line+length("%%PageBoundingBox:"))) page_bb_set = 1; } } section_len += line_len; if (DSCcomment(line) && iscomment(line+2, "EndSetup")) { readline(fd, enddoseps, &line, &position, &line_len); section_len += line_len; } doc->endsetup = position; doc->lensetup = section_len - line_len; } /* BEGIN Mozilla fix. Some documents generated by mozilla have resources between %%EndProlog and the first page and there isn't any setup section. So instead of including such resources in the first page, we add them here as an implicit setup section */ else if (doc->endprolog != position) { doc->beginsetup = beginsection; doc->endsetup = position; doc->lensetup = section_len - line_len; beginsection = 0; } /* END Mozilla fix */ /* BEGIN Windows NT fix ###jp### Mark Pfeifer (pfeiferm%ppddev@comet.cmis.abbott.com) told me about problems when viewing Windows NT 3.51 generated postscript files with gv. He found that the relevant postscript files show important postscript code after the '%%EndSetup' and before the first page comment '%%Page: x y'. */ if (doc->beginsetup) { while (!(DSCcomment(line) && (iscomment(line+2, "EndSetup") || (iscomment(line+2, "Page:") || iscomment(line+2, "Trailer") || (respect_eof && iscomment(line+2, "EOF"))))) && (readline(fd, enddoseps, &line, &position, &line_len))) { section_len += line_len; doc->lensetup = section_len - line_len; doc->endsetup = position; } } /* END Windows NT fix ###jp##*/ /* Individual Pages */ if (beginsection == 0) { beginsection = position; section_len = line_len; } while (blank(line) && readline(fd, enddoseps, &line, &position, &line_len)) { section_len += line_len; } newpage: while (DSCcomment(line) && iscomment(line+2, "Page:")) { if (maxpages == 0) { maxpages = 1; doc->pages = (struct page *) PS_calloc(maxpages, sizeof(struct page)); CHECK_MALLOCED(doc->pages); } label = ps_gettext(line+length("%%Page:"), &next_char); if (sscanf(next_char, "%d", &thispage) != 1) thispage = 0; if (nextpage == 1) { ignore = thispage != 1; } if (!ignore && thispage != nextpage) { PS_free(label); doc->numpages--; goto continuepage; } nextpage++; if (doc->numpages == maxpages) { maxpages++; doc->pages = (struct page *) PS_realloc(doc->pages, maxpages*sizeof (struct page)); CHECK_MALLOCED(doc->pages); } memset(&(doc->pages[doc->numpages]), 0, sizeof(struct page)); page_bb_set = NONE; doc->pages[doc->numpages].label = label; if (beginsection) { doc->pages[doc->numpages].begin = beginsection; beginsection = 0; } else { doc->pages[doc->numpages].begin = position; section_len = line_len; } continuepage: while (readline(fd, enddoseps, &line, &position, &line_len) && !(DSCcomment(line) && (iscomment(line+2, "Page:") || iscomment(line+2, "Trailer") || (respect_eof && iscomment(line+2, "EOF"))))) { section_len += line_len; if (!DSCcomment(line)) { /* Do nothing */ } else if (doc->pages[doc->numpages].orientation == NONE && iscomment(line+2, "PageOrientation:")) { sscanf(line+length("%%PageOrientation:"), "%256s", text); if (strcmp(text, "Portrait") == 0) { doc->pages[doc->numpages].orientation = PORTRAIT; } else if (strcmp(text, "Landscape") == 0) { doc->pages[doc->numpages].orientation = LANDSCAPE; } else if (strcmp(text, "Seascape") == 0) { doc->pages[doc->numpages].orientation = SEASCAPE; } else if (strcmp(text, "UpsideDown") == 0) { doc->pages[doc->numpages].orientation = UPSIDEDOWN; } } else if (doc->pages[doc->numpages].media == NULL && iscomment(line+2, "PageMedia:")) { cp = ps_gettext(line+length("%%PageMedia:"), NULL); for (dmp = doc->media, i=0; inummedia; i++, dmp++) { if (strcmp(cp, dmp->name) == 0) { doc->pages[doc->numpages].media = dmp; break; } } PS_free(cp); } else if (doc->pages[doc->numpages].media == NULL && iscomment(line+2, "PaperSize:")) { cp = ps_gettext(line+length("%%PaperSize:"), NULL); for (dmp = doc->media, i=0; inummedia; i++, dmp++) { /* Note: Paper size comment uses down cased paper size * name. Case insensitive compares are only used for * PaperSize comments. */ if (_spectre_strcasecmp(cp, dmp->name) == 0) { doc->pages[doc->numpages].media = dmp; break; } } PS_free(cp); } else if ((page_bb_set == NONE || page_bb_set == ATEND) && iscomment(line+2, "PageBoundingBox:")) { sscanf(line+length("%%PageBoundingBox:"), "%256s", text); if (strcmp(text, "(atend)") == 0 || strcmp(text, "atend") == 0) { page_bb_set = ATEND; } else { if (scan_boundingbox(doc->pages[doc->numpages].boundingbox, line+length("%%PageBoundingBox:"))) if(page_bb_set == NONE) page_bb_set = 1; } } } section_len += line_len; doc->pages[doc->numpages].end = position; doc->pages[doc->numpages].len = section_len - line_len; doc->numpages++; } /* Document Trailer */ if (beginsection) { doc->begintrailer = beginsection; beginsection = 0; } else { doc->begintrailer = position; section_len = line_len; } preread = 1; while ((preread || readline(fd, enddoseps, &line, &position, &line_len)) && !(respect_eof && DSCcomment(line) && iscomment(line+2, "EOF"))) { if (!preread) section_len += line_len; preread = 0; if (!DSCcomment(line)) { /* Do nothing */ } else if (iscomment(line+2, "Page:")) { PS_free(ps_gettext(line+length("%%Page:"), &next_char)); if (sscanf(next_char, "%d", &thispage) != 1) thispage = 0; if (!ignore && thispage == nextpage) { if (doc->numpages > 0) { doc->pages[doc->numpages-1].end = position; doc->pages[doc->numpages-1].len += section_len - line_len; } else { if (doc->endsetup) { doc->endsetup = position; doc->endsetup += section_len - line_len; } else if (doc->endprolog) { doc->endprolog = position; doc->endprolog += section_len - line_len; } } goto newpage; } } else if (!respect_eof && iscomment(line+2, "Trailer")) { /* What we thought was the start of the trailer was really */ /* the trailer of an EPS on the page. */ /* Set the end of the page to this trailer and keep scanning. */ if (doc->numpages > 0) { doc->pages[ doc->numpages-1 ].end = position; doc->pages[ doc->numpages-1 ].len += section_len - line_len; } doc->begintrailer = position; section_len = line_len; } else if (bb_set == ATEND && iscomment(line+2, "BoundingBox:")) { scan_boundingbox(doc->boundingbox, line + length("%%BoundingBox:")); } else if (orientation_set == ATEND && iscomment(line+2, "Orientation:")) { sscanf(line+length("%%Orientation:"), "%256s", text); if (strcmp(text, "Portrait") == 0) { doc->orientation = PORTRAIT; } else if (strcmp(text, "Landscape") == 0) { doc->orientation = LANDSCAPE; } else if (strcmp(text, "Seascape") == 0) { doc->orientation = SEASCAPE; } else if (strcmp(text, "UpsideDown") == 0) { doc->orientation = UPSIDEDOWN; } } else if (page_order_set == ATEND && iscomment(line+2, "PageOrder:")) { sscanf(line+length("%%PageOrder:"), "%256s", text); if (strcmp(text, "Ascend") == 0) { doc->pageorder = ASCEND; } else if (strcmp(text, "Descend") == 0) { doc->pageorder = DESCEND; } else if (strcmp(text, "Special") == 0) { doc->pageorder = SPECIAL; } } else if (pages_set == ATEND && iscomment(line+2, "Pages:")) { int page_order; if (sscanf(line+length("%%Pages:"), "%*u %d", &page_order) == 1) { if (page_order_set == NONE) { if (page_order == -1) doc->pageorder = DESCEND; else if (page_order == 0) doc->pageorder = SPECIAL; else if (page_order == 1) doc->pageorder = ASCEND; } } } } section_len += line_len; if (DSCcomment(line) && iscomment(line+2, "EOF")) { readline(fd, enddoseps, &line, &position, &line_len); section_len += line_len; } doc->endtrailer = position; doc->lentrailer = section_len - line_len; #if 0 section_len = line_len; preread = 1; while (preread || readline(fd, enddoseps, &line, &position, &line_len)) { if (!preread) section_len += line_len; preread = 0; if (DSCcomment(line) && iscomment(line+2, "Page:")) { PS_free(ps_gettext(line+length("%%Page:"), &next_char)); if (sscanf(next_char, "%d", &thispage) != 1) thispage = 0; if (!ignore && thispage == nextpage) { if (doc->numpages > 0) { doc->pages[doc->numpages-1].end = position; doc->pages[doc->numpages-1].len += doc->lentrailer + section_len - line_len; } else { if (doc->endsetup) { doc->endsetup = position; doc->endsetup += doc->lentrailer + section_len - line_len; } else if (doc->endprolog) { doc->endprolog = position; doc->endprolog += doc->lentrailer + section_len - line_len; } } goto newpage; } } } #endif ENDMESSAGE(psscan) ps_io_exit(fd); fclose (file); return doc; } /*###########################################################*/ /* * psfree -- free dynamic storage associated with document structure. */ /*###########################################################*/ static void psfree(struct document *doc) { unsigned int i; BEGINMESSAGE(psfree) if (doc) { for (i=0; inumpages; i++) { if (doc->pages[i].label) PS_free(doc->pages[i].label); } for (i=0; inummedia; i++) { if (doc->media[i].name) PS_free(doc->media[i].name); } if (doc->format) PS_free(doc->format); if (doc->filename) PS_free(doc->filename); if (doc->creator) PS_free(doc->creator); if (doc->fortext) PS_free(doc->fortext); if (doc->title) PS_free(doc->title); if (doc->date) PS_free(doc->date); if (doc->pages) PS_free(doc->pages); if (doc->media) PS_free(doc->media); if (doc->languagelevel) PS_free(doc->languagelevel); if (doc->doseps) free(doc->doseps); /* rjl: */ PS_free(doc); } ENDMESSAGE(psfree) } void psdocdestroy (struct document *doc) { if (!doc) return; _spectre_assert (doc->ref_count > 0); doc->ref_count--; if (doc->ref_count) return; psfree (doc); } struct document * psdocreference (struct document *doc) { if (!doc) return NULL; _spectre_assert (doc->ref_count > 0); doc->ref_count++; return doc; } /*----------------------------------------------------------*/ /* * gettextline -- skip over white space and return the rest of the line. * If the text begins with '(' return the text string * using ps_gettext(). */ /*----------------------------------------------------------*/ static char * gettextline(line) char *line; { char *cp; BEGINMESSAGE(gettextline) while (*line && (*line == ' ' || *line == '\t')) line++; if (*line == '(') { ENDMESSAGE(gettextline) return ps_gettext(line, NULL); } else { if (strlen(line) == 0) {ENDMESSAGE(gettextline) return NULL;} cp = (char *) PS_malloc(strlen(line)); CHECK_MALLOCED(cp); strncpy(cp, line, strlen(line)-1); cp[strlen(line)-1] = '\0'; ENDMESSAGE(gettextline) return cp; } } /*----------------------------------------------------------*/ /* * ps_gettext -- return the next text string on the line. * return NULL if nothing is present. */ /*----------------------------------------------------------*/ static char * ps_gettext(line, next_char) char *line; char **next_char; { char text[PSLINELENGTH]; /* Temporary storage for text */ char *cp; int quoted=0; BEGINMESSAGE(ps_gettext) while (*line && (*line == ' ' || *line == '\t')) line++; cp = text; if (*line == '(') { int level = 0; quoted=1; line++; while (*line && !(*line == ')' && level == 0 )) { if (cp - text >= PSLINELENGTH - 1) break; if (*line == '\\') { if (*(line+1) == 'n') { *cp++ = '\n'; line += 2; } else if (*(line+1) == 'r') { *cp++ = '\r'; line += 2; } else if (*(line+1) == 't') { *cp++ = '\t'; line += 2; } else if (*(line+1) == 'b') { *cp++ = '\b'; line += 2; } else if (*(line+1) == 'f') { *cp++ = '\f'; line += 2; } else if (*(line+1) == '\\') { *cp++ = '\\'; line += 2; } else if (*(line+1) == '(') { *cp++ = '('; line += 2; } else if (*(line+1) == ')') { *cp++ = ')'; line += 2; } else if (*(line+1) >= '0' && *(line+1) <= '9') { if (*(line+2) >= '0' && *(line+2) <= '9') { if (*(line+3) >= '0' && *(line+3) <= '9') { *cp++ = ((*(line+1) - '0')*8 + *(line+2) - '0')*8 + *(line+3) - '0'; line += 4; } else { *cp++ = (*(line+1) - '0')*8 + *(line+2) - '0'; line += 3; } } else { *cp++ = *(line+1) - '0'; line += 2; } } else { line++; *cp++ = *line++; } } else if (*line == '(') { level++; *cp++ = *line++; } else if (*line == ')') { level--; *cp++ = *line++; } else { *cp++ = *line++; } } /* Delete trailing ')' */ if (*line == ')') { line++; } } else { while (*line && !(*line == ' ' || *line == '\t' || *line == '\n')) { if (cp - text >= PSLINELENGTH - 2) break; *cp++ = *line++; } } *cp = '\0'; if (next_char) *next_char = line; if (!quoted && strlen(text) == 0) {ENDMESSAGE(ps_gettext) return NULL;} cp = (char *) PS_malloc(strlen(text)+1); CHECK_MALLOCED(cp); strcpy(cp, text); ENDMESSAGE(ps_gettext) return cp; } /*----------------------------------------------------------*/ /* ps_io_init */ /*----------------------------------------------------------*/ #define FD_FILE (fd->file) #define FD_FILEPOS (fd->filepos) #define FD_LINE_BEGIN (fd->line_begin) #define FD_LINE_END (fd->line_end) #define FD_LINE_LEN (fd->line_len) #define FD_LINE_TERMCHAR (fd->line_termchar) #define FD_BUF (fd->buf) #define FD_BUF_END (fd->buf_end) #define FD_BUF_SIZE (fd->buf_size) #define FD_STATUS (fd->status) #define FD_STATUS_OKAY 0 #define FD_STATUS_BUFTOOLARGE 1 #define FD_STATUS_NOMORECHARS 2 #define LINE_CHUNK_SIZE 4096 #define MAX_PS_IO_FGETCHARS_BUF_SIZE 57344 #define BREAK_PS_IO_FGETCHARS_BUF_SIZE 49152 static FileData ps_io_init(file) FILE *file; { FileData fd; size_t size = sizeof(FileDataStruct); BEGINMESSAGE(ps_io_init) fd = (FileData) PS_XtMalloc(size); memset((void*) fd ,0,(size_t)size); rewind(file); FD_FILE = file; FD_FILEPOS = ftell(file); FD_BUF_SIZE = (2*LINE_CHUNK_SIZE)+1; FD_BUF = PS_XtMalloc(FD_BUF_SIZE); FD_BUF[0] = '\0'; ENDMESSAGE(ps_io_init) return(fd); } /*----------------------------------------------------------*/ /* ps_io_rewind */ /*----------------------------------------------------------*/ static void ps_io_rewind(fd) FileData fd; { rewind(FD_FILE); FD_FILEPOS = ftell(FD_FILE); FD_BUF[0] = '\0'; FD_BUF_END = 0; FD_BUF_SIZE = 0; FD_LINE_BEGIN = 0; FD_LINE_END = 0; FD_LINE_LEN = 0; FD_LINE_TERMCHAR = '\0'; FD_STATUS = FD_STATUS_OKAY; } /*----------------------------------------------------------*/ /* ps_io_exit */ /*----------------------------------------------------------*/ static void ps_io_exit(fd) FileData fd; { BEGINMESSAGE(ps_io_exit) PS_XtFree(FD_BUF); PS_XtFree(fd); ENDMESSAGE(ps_io_exit) } /*----------------------------------------------------------*/ /* ps_io_fseek */ /*----------------------------------------------------------*/ static int ps_io_fseek(fd,offset) FileData fd; int offset; { int status; BEGINMESSAGE(ps_io_fseek) status=fseek(FD_FILE,(long)offset,SEEK_SET); FD_BUF_END = FD_LINE_BEGIN = FD_LINE_END = FD_LINE_LEN = 0; FD_FILEPOS = offset; FD_STATUS = FD_STATUS_OKAY; ENDMESSAGE(ps_io_fseek) return(status); } /*----------------------------------------------------------*/ /* ps_io_ftell */ /*----------------------------------------------------------*/ static int ps_io_ftell(fd) FileData fd; { BEGINMESSAGE(ps_io_ftell) IMESSAGE(FD_FILEPOS) ENDMESSAGE(ps_io_ftell) return(FD_FILEPOS); } /*----------------------------------------------------------*/ /* ps_io_fgetchars */ /*----------------------------------------------------------*/ #ifdef USE_MEMMOVE_CODE static void ps_memmove (d, s, l) char *d; const char *s; unsigned l; { if (s < d) for (s += l, d += l; l; --l) *--d = *--s; else if (s != d) for (; l; --l) *d++ = *s++; } #else # define ps_memmove memmove #endif static char * ps_io_fgetchars(fd,num) FileData fd; int num; { char *eol=NULL,*tmp; size_t size_of_char = sizeof(char); BEGINMESSAGE(ps_io_fgetchars) if (FD_STATUS != FD_STATUS_OKAY) { INFMESSAGE(aborting since status not okay) ENDMESSAGE(ps_io_fgetchars) return(NULL); } FD_BUF[FD_LINE_END] = FD_LINE_TERMCHAR; /* restoring char previously exchanged against '\0' */ FD_LINE_BEGIN = FD_LINE_END; #if 0 { int fp = (int)(ftell(FD_FILE)); if (num<0) { INFMESSAGE(reading line) } else { INFMESSAGE(reading specified num of chars) } IIMESSAGE(FD_BUF_SIZE,FD_BUF_END) IIMESSAGE(FD_LINE_BEGIN,FD_LINE_END) INFIMESSAGE(unparsed:,FD_BUF_END-FD_LINE_END) IMESSAGE(fp) IIMESSAGE(FD_FILEPOS,fp-(FD_BUF_END-FD_LINE_END)) } #endif /* 0 */ do { if (num<0) { /* reading whole line */ if (FD_BUF_END-FD_LINE_END) { /* strpbrk is faster but fails on lines with embedded NULLs eol = strpbrk(FD_BUF+FD_LINE_END,"\n\r"); */ tmp = FD_BUF + FD_BUF_END; eol = FD_BUF + FD_LINE_END; while (eol < tmp && *eol != '\n' && *eol != '\r') eol++; if (eol >= tmp) eol = NULL; if (eol) { if (*eol=='\r' && *(eol+1)=='\n') eol += 2; else eol++; break; } } } else { /* reading specified num of chars */ if (FD_BUF_END >= FD_LINE_BEGIN+num) { eol = FD_BUF+FD_LINE_BEGIN+num; break; } } INFMESSAGE(no end of line yet) if (FD_BUF_END - FD_LINE_BEGIN > BREAK_PS_IO_FGETCHARS_BUF_SIZE) { INFMESSAGE(breaking line artificially) eol = FD_BUF + FD_BUF_END - 1; break; } while (FD_BUF_SIZE < FD_BUF_END+LINE_CHUNK_SIZE+1) { if (FD_BUF_SIZE > MAX_PS_IO_FGETCHARS_BUF_SIZE) { /* we should never get here, since the line is broken artificially after BREAK_PS_IO_FGETCHARS_BUF_SIZE bytes. */ INFMESSAGE(buffer became to large) ENDMESSAGE(ps_io_fgetchars) fprintf(stderr, "gv: ps_io_fgetchars: Fatal Error: buffer became too large.\n"); exit(-1); } if (FD_LINE_BEGIN) { INFMESSAGE(moving line to begin of buffer) ps_memmove((void*)FD_BUF,(void*)(FD_BUF+FD_LINE_BEGIN), ((size_t)(FD_BUF_END-FD_LINE_BEGIN+1))*size_of_char); FD_BUF_END -= FD_LINE_BEGIN; FD_LINE_BEGIN = 0; } else { INFMESSAGE(enlarging buffer) /* FD_BUF_SIZE = FD_BUF_END+LINE_CHUNK_SIZE+1; */ FD_BUF_SIZE = FD_BUF_SIZE+LINE_CHUNK_SIZE+1; IMESSAGE(FD_BUF_SIZE) FD_BUF = PS_XtRealloc(FD_BUF,FD_BUF_SIZE); } } FD_LINE_END = FD_BUF_END; /* read() seems to fail sometimes (? ? ?) so we always use fread ###jp###,07/31/96*/ FD_BUF_END += fread(FD_BUF+FD_BUF_END,size_of_char,LINE_CHUNK_SIZE,FD_FILE); FD_BUF[FD_BUF_END] = '\0'; if (FD_BUF_END-FD_LINE_END == 0) { INFMESSAGE(failed to read more chars) ENDMESSAGE(ps_io_fgetchars) FD_STATUS = FD_STATUS_NOMORECHARS; return(NULL); } } while (1); FD_LINE_END = eol - FD_BUF; FD_LINE_LEN = FD_LINE_END - FD_LINE_BEGIN; FD_LINE_TERMCHAR = FD_BUF[FD_LINE_END]; FD_BUF[FD_LINE_END] = '\0'; #ifdef USE_FTELL_FOR_FILEPOS if (FD_LINE_END==FD_BUF_END) { INFMESSAGE(### using ftell to get FD_FILEPOS) /* For VMS we cannot assume that the record is FD_LINE_LEN bytes long on the disk. For stream_lf and stream_cr that is true, but not for other formats, since VAXC/DECC converts the formatting into a single \n. eg. variable format files have a 2-byte length and padding to an even number of characters. So, we use ftell for each record. This still will not work if we need to fseek to a \n or \r inside a variable record (ftell always returns the start of the record in this case). (Tim Adye, adye@v2.rl.ac.uk) */ FD_FILEPOS = ftell(FD_FILE); } else #endif /* USE_FTELL_FOR_FILEPOS */ FD_FILEPOS += FD_LINE_LEN; #if 0 SMESSAGE(FD_BUF+FD_LINE_BEGIN) IIMESSAGE(FD_LINE_BEGIN,FD_LINE_END) IIMESSAGE(FD_BUF_END,FD_LINE_LEN) #endif ENDMESSAGE(ps_io_fgetchars) return(FD_BUF+FD_LINE_BEGIN); } /*----------------------------------------------------------*/ /* readline() Read the next line in the postscript file. Automatically skip over data (as indicated by %%BeginBinary/%%EndBinary or %%BeginData/%%EndData comments.) Also, skip over included documents (as indicated by %%BeginDocument/%%EndDocument comments.) */ /*----------------------------------------------------------*/ static char * readline (fd, enddoseps, lineP, positionP, line_lenP) FileData fd; long enddoseps; char **lineP; long *positionP; unsigned int *line_lenP; { unsigned int nbytes=0; int skipped=0; int nesting_level=0; char *line; BEGINMESSAGE(readline) if (positionP) *positionP = FD_FILEPOS; if (positionP && enddoseps) { if (*positionP >= enddoseps) return NULL; /* don't read any more, we have reached end of dos eps section */ } line = ps_io_fgetchars(fd,-1); if (!line) { INFMESSAGE(could not get line) *line_lenP = 0; *lineP = empty_string; ENDMESSAGE(readline) return(NULL); } *line_lenP = FD_LINE_LEN; #define IS_COMMENT(comment) \ (DSCcomment(line) && iscomment(line+2,(comment))) #define IS_BEGIN(comment) \ (iscomment(line+7,(comment))) #define IS_END(comment) \ (iscomment(line+5,(comment))) #define SKIP_WHILE(cond) \ while (readline(fd, enddoseps, &line, NULL, &nbytes) && (cond)) *line_lenP += nbytes; \ skipped=1; #define SKIP_UNTIL_1(comment) { \ INFMESSAGE(skipping until comment) \ SKIP_WHILE((!IS_COMMENT(comment))) \ INFMESSAGE(completed skipping until comment) \ } #define SKIP_UNTIL_2(comment1,comment2) { \ INFMESSAGE(skipping until comment1 or comment2)\ SKIP_WHILE((!IS_COMMENT(comment1) && !IS_COMMENT(comment2)))\ INFMESSAGE(completed skipping until comment1 or comment2)\ } #if 0 if ((scanstyle&SCANSTYLE_MISSING_BEGINDOCUMENT) && (line[0] == '%') && (*line_lenP > 11) && (iscomment(line,"%!PS-Adobe-") || iscomment(line + 1,"%!PS-Adobe-"))) { char *c=line+11; while (*c && !isspace(*c)) c++; if (isspace(*c)) while (*c && isspace(*c)) c++; /* don't skip EPSF files */ printf("line in question: %s\n",line); if (strncmp(c,"EPSF",4)) { printf("skipping starts here: %s\n",line); SKIP_UNTIL_1("EOF") *line_lenP += nbytes; readline(fd, enddoseps, &line, NULL, &nbytes); printf("skipping ends here: %s\n",line); } } else #endif if (!IS_COMMENT("Begin")) {} /* Do nothing */ else if IS_BEGIN("Document:") { /* Skip the EPS without handling its content */ nesting_level=1; line = ps_io_fgetchars(fd,-1); if (line) *line_lenP += FD_LINE_LEN; while (line) { if (IS_COMMENT("Begin") && IS_BEGIN("Document:")) nesting_level++; else if (IS_COMMENT("End") && IS_END("Document")) nesting_level--; if (nesting_level == 0) break; line = ps_io_fgetchars(fd,-1); if (line) *line_lenP += FD_LINE_LEN; } } else if IS_BEGIN("Feature:") SKIP_UNTIL_1("EndFeature") #ifdef USE_ACROREAD_WORKAROUND else if IS_BEGIN("File") SKIP_UNTIL_2("EndFile","EOF") #else else if IS_BEGIN("File") SKIP_UNTIL_1("EndFile") #endif else if IS_BEGIN("Font") SKIP_UNTIL_1("EndFont") else if IS_BEGIN("ProcSet") SKIP_UNTIL_1("EndProcSet") else if IS_BEGIN("Resource") SKIP_UNTIL_1("EndResource") else if IS_BEGIN("Data:") { int num; char text[101]; INFMESSAGE(encountered "BeginData:") if (FD_LINE_LEN > 100) FD_BUF[100] = '\0'; text[0] = '\0'; if (sscanf(line+length("%%BeginData:"), "%d %*s %100s", &num, text) >= 1) { if (strcmp(text, "Lines") == 0) { INFIMESSAGE(number of lines to skip:,num) while (num) { line = ps_io_fgetchars(fd,-1); if (line) *line_lenP += FD_LINE_LEN; num--; } } else { int read_chunk_size = LINE_CHUNK_SIZE; INFIMESSAGE(number of chars to skip:,num) while (num>0) { if (num <= LINE_CHUNK_SIZE) read_chunk_size=num; line = ps_io_fgetchars(fd,read_chunk_size); if (line) *line_lenP += FD_LINE_LEN; num -= read_chunk_size; } } } SKIP_UNTIL_1("EndData") } else if IS_BEGIN("Binary:") { int num; INFMESSAGE(encountered "BeginBinary:") if (sscanf(line+length("%%BeginBinary:"), "%d", &num) == 1) { int read_chunk_size = LINE_CHUNK_SIZE; INFIMESSAGE(number of chars to skip:,num) while (num>0) { if (num <= LINE_CHUNK_SIZE) read_chunk_size=num; line = ps_io_fgetchars(fd,read_chunk_size); if (line) *line_lenP += FD_LINE_LEN; num -= read_chunk_size; } SKIP_UNTIL_1("EndBinary") } } if (skipped) { INFMESSAGE(skipped lines) *line_lenP += nbytes; *lineP = skipped_line; } else { *lineP = FD_BUF+FD_LINE_BEGIN; } ENDMESSAGE(readline) return(FD_BUF+FD_LINE_BEGIN); } /*----------------------------------------------------------*/ /* readlineuntil() Read the next line in the postscript file until char is found Similar to readline, but it doesn't skip lines. */ /*----------------------------------------------------------*/ static char * readlineuntil (fd, enddoseps, lineP, positionP, line_lenP, charP) FileData fd; long enddoseps; char **lineP; long *positionP; unsigned int *line_lenP; char charP; { char *line; if (positionP) *positionP = FD_FILEPOS; do { line = ps_io_fgetchars(fd,-1); if (!line) { INFMESSAGE(could not get line) *line_lenP = 0; *lineP = empty_string; ENDMESSAGE(readline) return(NULL); } if (positionP) *positionP = FD_FILEPOS; *line_lenP = FD_LINE_LEN; *lineP = FD_BUF+FD_LINE_BEGIN; } while (line[0] != charP); return(FD_BUF+FD_LINE_BEGIN); } /*###########################################################*/ /* * pscopyuntil -- copy lines of Postscript from a section of one file * to another file until a particular comment is reached. * Automatically switch to binary copying whenever * %%BeginBinary/%%EndBinary or %%BeginData/%%EndData * comments are encountered. */ /*###########################################################*/ char * pscopyuntil(fd, to, begin, end, comment) FileData fd; FILE *to; long begin; /* set negative to avoid initial seek */ long end; char *comment; { char *line; int comment_length; BEGINMESSAGE(pscopyuntil) if (comment) { INFSMESSAGE(will copy until,comment) comment_length = strlen(comment); } else { INFMESSAGE(will copy until specified file position) comment_length = 0; } if (begin >= 0) ps_io_fseek(fd, begin); while (ps_io_ftell(fd) < end) { line = ps_io_fgetchars(fd,-1); if (!line) break; if (comment && strncmp(line, comment, comment_length) == 0) { char *cp = (char *) PS_malloc(strlen(line)+1); INFSMESSAGE(encountered specified,comment) CHECK_MALLOCED(cp); strcpy(cp, line); ENDMESSAGE(pscopyuntil) return cp; } fputs(line, to); if (!IS_COMMENT("Begin")) {} /* Do nothing */ else if IS_BEGIN("Data:") { int num; char text[101]; INFMESSAGE(encountered "BeginData:") if (FD_LINE_LEN > 100) FD_BUF[100] = '\0'; text[0] = '\0'; if (sscanf(line+length("%%BeginData:"), "%d %*s %100s", &num, text) >= 1) { if (strcmp(text, "Lines") == 0) { INFIMESSAGE(number of lines:,num) while (num) { line = ps_io_fgetchars(fd,-1); if (line) fputs(line,to); num--; } } else { int read_chunk_size = LINE_CHUNK_SIZE; INFIMESSAGE(number of chars:,num) while (num>0) { if (num <= LINE_CHUNK_SIZE) read_chunk_size=num; line = ps_io_fgetchars(fd,read_chunk_size); if (line) fwrite(line,sizeof(char),FD_LINE_LEN, to); num -= read_chunk_size; } } } } else if IS_BEGIN("Binary:") { int num; INFMESSAGE(encountered "BeginBinary:") if (sscanf(line+length("%%BeginBinary:"), "%d", &num) == 1) { int read_chunk_size = LINE_CHUNK_SIZE; INFIMESSAGE(number of chars:,num) while (num>0) { if (num <= LINE_CHUNK_SIZE) read_chunk_size=num; line = ps_io_fgetchars(fd,read_chunk_size); if (line) fwrite(line, sizeof (char),FD_LINE_LEN, to); num -= read_chunk_size; } } } } ENDMESSAGE(pscopyuntil) return NULL; } /*----------------------------------------------------------*/ /* blank */ /* Check whether the line contains nothing but white space. */ /*----------------------------------------------------------*/ static int blank(line) char *line; { char *cp = line; BEGINMESSAGE(blank) while (*cp == ' ' || *cp == '\t') cp++; ENDMESSAGE(blank) return *cp == '\n' || *cp== '\r' || (*cp == '%' && (line[0] != '%' || line[1] != '%')); } void pscopy (FILE *from, FILE *to, Document d, long begin, long end) { FileData fd; fd = ps_io_init(from); pscopyuntil(fd, to, begin, end, NULL); ps_io_exit(fd); } void pscopyheaders (FILE *from, FILE *to, Document d) { char *comment; Boolean pages_written = False; int here; FileData fd; fd = ps_io_init(from); here = d->beginheader; while ((comment=pscopyuntil(fd,to,here,d->endheader,"%%Pages:"))) { SMESSAGE(comment) here = ps_io_ftell(fd); if (pages_written) { PS_free(comment); continue; } fputs("%%Pages: (atend)\n", to); pages_written = True; PS_free(comment); } if (!pages_written && !d->epsf) fputs("%%Pages: (atend)\n", to); pscopyuntil(fd, to, d->beginpreview, d->endpreview,NULL); pscopyuntil(fd, to, d->begindefaults, d->enddefaults,NULL); pscopyuntil(fd, to, d->beginprolog, d->endprolog,NULL); pscopyuntil(fd, to, d->beginsetup, d->endsetup,NULL); ps_io_exit(fd); } void pscopypage (FILE *from, FILE *to, Document d, unsigned int page, unsigned int n_page) { FileData fd; char *comment; fd = ps_io_init(from); comment = pscopyuntil(fd,to,d->pages[page].begin,d->pages[page].end, "%%Page:"); fprintf(to, "%%%%Page: %s %d\n",d->pages[page].label, n_page); PS_free(comment); pscopyuntil(fd, to, -1, d->pages[page].end,NULL); ps_io_exit(fd); } void pscopytrailer (FILE *from, FILE *to, Document d, unsigned int n_pages) { FileData fd; Boolean pages_written = False; char *comment; int here; fd = ps_io_init(from); here = d->begintrailer; if (!d->epsf) { pscopyuntil(fd, to, here, here + strlen ("%%Trailer") + 1, NULL); here = ps_io_ftell(fd); fprintf(to, "%%%%Pages: %d\n",n_pages); } while ((comment = pscopyuntil(fd, to, here, d->endtrailer, "%%Pages:"))) { here = ps_io_ftell(fd); if (pages_written) { PS_free(comment); continue; } pages_written = True; PS_free(comment); } ps_io_exit(fd); } /*##########################################################*/ /* pscopydoc */ /* Copy the headers, marked pages, and trailer to fp */ /*##########################################################*/ void pscopydoc(dest_file,src_filename,d,pagelist) FILE *dest_file; char *src_filename; Document d; char *pagelist; { FILE *src_file; char text[PSLINELENGTH]; char *comment; Boolean pages_written = False; Boolean pages_atend = False; int pages; int page = 1; unsigned int i, j; int here; FileData fd; BEGINMESSAGE(pscopydoc) INFSMESSAGE(copying from file, src_filename) src_file = fopen(src_filename, "rb"); fd = ps_io_init(src_file); i=0; pages=0; while (pagelist[i]) { if (pagelist[i]=='*') pages++; i++; } INFIMESSAGE(number of pages to be copied,pages) here = d->beginheader; while ((comment=pscopyuntil(fd,dest_file,here,d->endheader,"%%Pages:"))) { SMESSAGE(comment) here = ps_io_ftell(fd); if (pages_written || pages_atend) { PS_free(comment); continue; } sscanf(comment+length("%%Pages:"), "%256s", text); if (strcmp(text, "(atend)") == 0) { fputs(comment, dest_file); pages_atend = True; } else { switch (sscanf(comment+length("%%Pages:"), "%*d %d", &i)) { case 1: fprintf(dest_file, "%%%%Pages: %d %d\n", pages, i); break; default: fprintf(dest_file, "%%%%Pages: %d\n", pages); break; } pages_written = True; } PS_free(comment); } pscopyuntil(fd, dest_file, d->beginpreview, d->endpreview,NULL); pscopyuntil(fd, dest_file, d->begindefaults, d->enddefaults,NULL); pscopyuntil(fd, dest_file, d->beginprolog, d->endprolog,NULL); pscopyuntil(fd, dest_file, d->beginsetup, d->endsetup,NULL); for (i = 0; i < d->numpages; i++) { if (d->pageorder == DESCEND) j = (d->numpages - 1) - i; else j = i; if (pagelist[j]=='*') { comment = pscopyuntil(fd,dest_file,d->pages[i].begin,d->pages[i].end, "%%Page:"); fprintf(dest_file, "%%%%Page: %s %d\n",d->pages[i].label, page++); PS_free(comment); pscopyuntil(fd, dest_file, -1, d->pages[i].end,NULL); } } here = d->begintrailer; while ((comment = pscopyuntil(fd, dest_file, here, d->endtrailer, "%%Pages:"))) { here = ps_io_ftell(fd); if (pages_written) { PS_free(comment); continue; } switch (sscanf(comment+length("%%Pages:"), "%*d %d", &i)) { case 1: fprintf(dest_file, "%%%%Pages: %d %d\n", pages, i); break; default: fprintf(dest_file, "%%%%Pages: %d\n", pages); break; } pages_written = True; PS_free(comment); } fclose(src_file); ps_io_exit(fd); ENDMESSAGE(pscopydoc) } #undef length /* rjl: routines to handle reading DOS EPS files */ static unsigned long dsc_arch = 0x00000001; /* change byte order if architecture is big-endian */ static PS_DWORD reorder_dword(val) PS_DWORD val; { if (*((char *)(&dsc_arch))) return val; /* little endian machine */ else return ((val&0xff) << 24) | ((val&0xff00) << 8) | ((val&0xff0000L) >> 8) | ((val>>24)&0xff); } /* change byte order if architecture is big-endian */ static PS_WORD reorder_word(val) PS_WORD val; { if (*((char *)(&dsc_arch))) return val; /* little endian machine */ else return (PS_WORD) ((PS_WORD)(val&0xff) << 8) | (PS_WORD)((val&0xff00) >> 8); } /* DOS EPS header reading */ static unsigned long ps_read_doseps(fd,doseps) FileData fd; DOSEPS *doseps; { fread(doseps->id, 1, 4, FD_FILE); if (! ((doseps->id[0]==0xc5) && (doseps->id[1]==0xd0) && (doseps->id[2]==0xd3) && (doseps->id[3]==0xc6)) ) { /* id is "EPSF" with bit 7 set */ ps_io_rewind(fd); return 0; /* OK */ } fread(&doseps->ps_begin, 4, 1, FD_FILE); /* PS offset */ doseps->ps_begin = (unsigned long)reorder_dword(doseps->ps_begin); fread(&doseps->ps_length, 4, 1, FD_FILE); /* PS length */ doseps->ps_length = (unsigned long)reorder_dword(doseps->ps_length); fread(&doseps->mf_begin, 4, 1, FD_FILE); /* Metafile offset */ doseps->mf_begin = (unsigned long)reorder_dword(doseps->mf_begin); fread(&doseps->mf_length, 4, 1, FD_FILE); /* Metafile length */ doseps->mf_length = (unsigned long)reorder_dword(doseps->mf_length); fread(&doseps->tiff_begin, 4, 1, FD_FILE); /* TIFF offset */ doseps->tiff_begin = (unsigned long)reorder_dword(doseps->tiff_begin); fread(&doseps->tiff_length, 4, 1, FD_FILE); /* TIFF length */ doseps->tiff_length = (unsigned long)reorder_dword(doseps->tiff_length); fread(&doseps->checksum, 2, 1, FD_FILE); doseps->checksum = (unsigned short)reorder_word(doseps->checksum); ps_io_fseek(fd, doseps->ps_begin); /* seek to PS section */ return doseps->ps_begin + doseps->ps_length; } int psgetpagebbox (const struct document *doc, int page, int *urx, int *ury, int *llx, int *lly) { int new_llx = 0; int new_lly = 0; int new_urx = 0; int new_ury = 0; if ((page >= 0) && (doc->pages) && (doc->pages[page].boundingbox[URX] > doc->pages[page].boundingbox[LLX]) && (doc->pages[page].boundingbox[URY] > doc->pages[page].boundingbox[LLY])) { /* use page bbox */ new_llx = doc->pages[page].boundingbox[LLX]; new_lly = doc->pages[page].boundingbox[LLY]; new_urx = doc->pages[page].boundingbox[URX]; new_ury = doc->pages[page].boundingbox[URY]; } else if ((doc->boundingbox[URX] > doc->boundingbox[LLX]) && (doc->boundingbox[URY] > doc->boundingbox[LLY])) { /* use doc bbox */ new_llx = doc->boundingbox[LLX]; new_lly = doc->boundingbox[LLY]; new_urx = doc->boundingbox[URX]; new_ury = doc->boundingbox[URY]; } *llx = new_llx; *lly = new_lly; *urx = new_urx; *ury = new_ury; return (new_llx != 0 || new_lly != 0 || new_urx != 0 || new_ury != 0); } /* From Evince */ #define DEFAULT_PAGE_SIZE 1 void psgetpagebox (const struct document *doc, int page, int *urx, int *ury, int *llx, int *lly) { int new_llx = 0; int new_lly = 0; int new_urx = 0; int new_ury = 0; int new_pagesize = -1; if (new_pagesize == -1) { new_pagesize = DEFAULT_PAGE_SIZE; if (doc) { /* If we have a document: * We use -- the page size (if specified) * or the doc. size (if specified) * or the page bbox (if specified) * or the bounding box */ if ((page >= 0) && (doc->numpages > (unsigned int)page) && (doc->pages) && (doc->pages[page].media)) { new_pagesize = doc->pages[page].media - doc->media; } else if (doc->default_page_media != NULL) { new_pagesize = doc->default_page_media - doc->media; } else if ((page >= 0) && (doc->numpages > (unsigned int)page) && (doc->pages) && (doc->pages[page].boundingbox[URX] > doc->pages[page].boundingbox[LLX]) && (doc->pages[page].boundingbox[URY] > doc->pages[page].boundingbox[LLY])) { new_pagesize = -1; } else if ((doc->boundingbox[URX] > doc->boundingbox[LLX]) && (doc->boundingbox[URY] > doc->boundingbox[LLY])) { new_pagesize = -1; } } } /* Compute bounding box */ if (doc && (doc->epsf || new_pagesize == -1)) { /* epsf or bbox */ psgetpagebbox (doc, page, &new_urx, &new_ury, &new_llx, &new_lly); } else { if (new_pagesize < 0) new_pagesize = DEFAULT_PAGE_SIZE; new_llx = new_lly = 0; if (doc && doc->media && ((unsigned int)new_pagesize < doc->nummedia)) { new_urx = doc->media[new_pagesize].width; new_ury = doc->media[new_pagesize].height; } else { new_urx = papersizes[new_pagesize].width; new_ury = papersizes[new_pagesize].height; } } if (new_urx <= new_llx) new_urx = papersizes[12].width; if (new_ury <= new_lly) new_ury = papersizes[12].height; *urx = new_urx; *ury = new_ury; *llx = new_llx; *lly = new_lly; }