eval '(exit $?0)' && eval 'exec perl -S $0 ${1+"$@"}' && eval 'exec perl -S $0 $argv:q' if 0; use strict; # $Id: epstopdf.pl 16244 2009-11-30 01:36:08Z karl $ # (Copyright lines below.) # # Redistribution and use in source and binary forms, with or without # modification, are permitted provided that the following conditions are met: # # 1. Redistributions of source code must retain the above copyright # notice, this list of conditions and the following disclaimer. # 2. Redistributions in binary form must reproduce the above copyright # notice, this list of conditions and the following disclaimer in the # documentation and/or other materials provided with the distribution. # 3. The name of the author may not be used to endorse or promote # products derived from this software without specific prior written # permission. # # THIS SOFTWARE IS PROVIDED BY THE AUTHOR ``AS IS'' AND ANY EXPRESS OR # IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE IMPLIED # WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE # DISCLAIMED. IN NO EVENT SHALL THE AUTHOR BE LIABLE FOR ANY DIRECT, # INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL DAMAGES # (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR # SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) # HOWEVER CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, # STRICT LIABILITY, OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN # ANY WAY OUT OF THE USE OF THIS SOFTWARE, EVEN IF ADVISED OF THE # POSSIBILITY OF SUCH DAMAGE. # # ---------------------------------------------------------------- # # This is a script to transform an EPS file such that: # a) it is guaranteed to start at the 0,0 coordinate. # b) it sets a page size exactly corresponding to the BoundingBox # This means that when Ghostscript renders it, the result needs no # cropping, and the PDF MediaBox is correct. # c) the result is piped to Ghostscript and a PDF version written. # # It needs a Level 2 PS interpreter. # If the bounding box is not right, of course, there will be problems. # # One thing not allowed for is the case of # "%%BoundingBox: (atend)" when input is not seekable (e.g., from a pipe), # which is more complicated. # # emacs-page # History # 2009/11/27 v2.12 (Karl Berry) # * Make --filter work again # 2009/11/25 (Manuel P\'egouri\'e-Gonnard) # * Better extension detection, suggested by A. Cherepanov. # 2009/10/18 (Manuel P\'egouri\'e-Gonnard) # * Better argument validation (Alexander Cherepanov). # * Use list form of pipe open() (resp. system()) to prevent injection. # Since Perl's fork() emulation doesn't work on Windows with Perl 5.8.8 from # TeX Live 2009, use a temporary file instead of a pipe on Windows. # 2009/10/14 (Manuel P\'egouri\'e-Gonnard) # * Added restricted mode. # 2009/09/27 v2.11 (Karl Berry) # * Fixed two bugs in the (atend) handling code (Martin von Gagern) # * Improved handling of CR line ending (Martin von Gagern) # * More error checking # * --version option # * Create source repository in TeX Live # 2009/07/17 v2.9.11gw # * Added -dSAFER to default gs options # TL2009 wants to use a restricted variant of -shell-escape, # allowing epstopdf to run. However without -dSAFER Ghostscript # allows writing to files (other than given in -sOutputFile) # and running commands (through Ghostscript pipe's language feature). # 2009/05/09 v2.9.10gw # * Changed cygwin name for ghostscript to gs # 2008/08/26 v2.9.9gw # * Switch to embed fonts (default=yes) (J.P. Chretien) # * turned no AutoRotatePages into an option (D. Kreil) (default = None) # * Added resolution switch (D. Kreil) # * Added BSD-style license # 2007/07/18 v2.9.8gw # 2007/05/18 v.2.9.7gw (Gerben Wierda) # * Merged both supplied 2.9.6 versions # 2007/05/15 v2.9.6tp (Theo Papadopoulo) # * Simplified the (atend) support # 2007/01/24 v2.9.6sw (Staszek Wawrykiewicz) # * patched to work also on Windows # 2005/10/06 v2.9.5gw (Gerben Wierda) # * Fixed a horrendous bug in the (atend) handling code # 2005/10/06 v2.9.4gw (Gerben Wierda) # * This has become the official version for now # 2005/10/01 v2.9.3draft (Gerben Wierda) # * Quote OutFilename # 2005/09/29 v2.9.2draft (Gerben Wierda) # * Quote OutFilename # 2004/03/17 v2.9.1draft (Gerben Wierda) # * No autorotate page # 2003/04/22 v2.9draft (Gerben Wierda) # * Fixed bug where with cr-eol files everything up to the first %! # * in the first 2048 bytes was gobbled (double ugh!) # 2002/02/21 v2.8draft (Gerben Wierda) # * Fixed bug where last line of buffer was not copied out (ugh!) # 2002/02/18 v2.8draft (Gerben Wierda) # * Handle different eol styles transparantly # * Applied fix from Peder Axensten for Freehand bug # 2001/03/05 v2.7 (Heiko Oberdiek) # * Newline before grestore for the case that there is no # whitespace at the end of the eps file. # 2000/11/05 v2.6 (Heiko Oberdiek) # * %%HiresBoundingBox corrected to %%HiResBoundingBox # 1999/05/06 v2.5 (Heiko Oberdiek) # * New options: --hires, --exact, --filter, --help. # * Many cosmetics: title, usage, ... # * New code for debug, warning, error # * Detecting of cygwin perl # * Scanning for %%{Hires,Exact,}BoundingBox. # * Scanning only the header in order not to get a wrong # BoundingBox of an included file. # * (atend) supported. # * uses strict; (earlier error detecting). # * changed first comment from '%!PS' to '%!'; # * corrected (atend) pattern: '\s*\(atend\)' # * using of $bbxpat in all BoundingBox cases, # correct the first white space to '...Box:\s*$bb...' # * corrected first line (one line instead of two before 'if 0;'; # # Thomas Esser, Sept. 1998: change initial lines to find # perl along $PATH rather than guessing a fixed location. The above # construction should work with most shells. # # Originally by Sebastian Rahtz, for Elsevier Science # with extra tricks from Hans Hagen's texutil and many more. # emacs-page ### program identification my $program = "epstopdf"; my $ident = '($Id: epstopdf.pl 16244 2009-11-30 01:36:08Z karl $) 2.12'; my $copyright = < This is free software: you are free to change and redistribute it. There is NO WARRANTY, to the extent permitted by law. END_COPYRIGHT my $title = "$program $ident\n"; ### ghostscript command name my $GS = "gs"; $GS = "gswin32c" if $^O eq 'MSWin32'; ### restricted mode my $restricted = 0; $restricted = 1 if $0 =~ /repstopdf/; ### options $::opt_outfile=""; $::opt_compress=1; $::opt_debug=0; $::opt_embed=1; $::opt_exact=0; $::opt_filter=0; $::opt_gs=1; $::opt_hires=0; $::opt_gscmd=""; $::opt_res=0; $::opt_autorotate="None"; ### usage my @bool = ("false", "true"); my $resmsg = $::opt_res ? $::opt_res : "[use gs default]"; my $rotmsg = $::opt_autorotate ? $::opt_autorotate : "[use gs default]"; my $usage = <<"END_OF_USAGE"; ${title}Usage: $program [OPTION]... [EPSFILE] Convert EPS to PDF, by default using Ghostscript. Options: --help display this help and exit --version display version information and exit --outfile=FILE write result to FILE --(no)compress use compression (default: $bool[$::opt_compress]) --(no)debug write debugging info (default: $bool[$::opt_debug]) --(no)embed embed fonts (default: $bool[$::opt_embed]) --(no)exact scan ExactBoundingBox (default: $bool[$::opt_exact]) --(no)filter read standard input (default: $bool[$::opt_filter]) --(no)gs run ghostscript (default: $bool[$::opt_gs]) --(no)hires scan HiResBoundingBox (default: $bool[$::opt_hires]) --gscmd=VAL pipe output to VAL (default: $GS) --res=DPI set image resolution (default: $resmsg) --autorotate=VAL set AutoRotatePages (default: $rotmsg) Recognized VAL choices: None, All, PageByPage For EPS files, PageByPage is equivalent to All --restricted use restricted mode (default: $bool[$restricted]) Examples for producing 'test.pdf': * $program test.eps * produce postscript | $program --filter >test.pdf * produce postscript | $program -f -d -o=test.pdf Example: look for HiResBoundingBox and produce corrected PostScript: * $program -d --nogs --hires test.ps >testcorr.ps When reporting bugs, please include an input file and command line options so the problem can be reproduced. Report bugs to: tex-k\@tug.org epstopdf home page: END_OF_USAGE ### process options use Getopt::Long; GetOptions ( "help", "version", "outfile=s", # \ref{openout_any} "compress!", "debug!", "embed!", "exact!", "filter!", "gs!", "hires!", "gscmd=s", # \ref{val_gscmd} "res=i", # validated by Getopt ('i' specifier) "autorotate=s", # \ref{val_autorotate} "restricted", ) or die $usage; ### help functions sub debug { print STDERR "* @_\n" if $::opt_debug; } sub warning { print STDERR "==> Warning: @_\n"; } sub error { die "$title!!! Error: @_\n"; } sub errorUsage { die "$usage\n!!! Error: @_\n"; } ### restricted option $restricted = 1 if $::opt_restricted; debug "Restricted mode activated" if $restricted; ### help, version options. if ($::opt_help) { print $usage; exit (0); } if ($::opt_version) { print $title; print $copyright; exit (0); } ### get input filename my $InputFilename = ""; if ($::opt_filter) { @ARGV == 0 or die errorUsage "Input file cannot be used with filter option"; debug "Filtering: will read standard input"; } else { @ARGV > 0 or die errorUsage "Input filename missing"; @ARGV < 2 or die errorUsage "Unknown option or too many input files"; $InputFilename = $ARGV[0]; #-r $InputFilename or error "\"$InputFilename\" not readable"; debug "Input filename:", $InputFilename; } ### option gscmd if ($::opt_gscmd) { debug "Switching from $GS to $::opt_gscmd"; $GS = $::opt_gscmd; # validate GS \label{val_gscmd} if ($restricted) { $GS =~ /^(gs|mgs|gswin32c|gs386|gsos2)\z/ or $GS =~ /^gs[\-_]?(\d|\d[\.-_]?\d\d)c?\z/ or die error "Value of gscmd '$GS' not allowed in restricted mode."; } } ### start building GS command line for the pipe my @GS = ($GS); push @GS, qw(-q -dNOPAUSE -dSAFER -sDEVICE=pdfwrite); ### option outfile my $OutputFilename = $::opt_outfile; if ($OutputFilename eq "") { if ($::opt_gs) { $OutputFilename = $InputFilename; if (!$::opt_filter) { my $ds = ($^O eq "MSWin32" || $^O eq "cygwin") ? '\\/' : '/'; $OutputFilename =~ s/\.[^\.$ds]*$//; $OutputFilename .= ".pdf"; } } else { $OutputFilename = "-"; # no ghostscript, write to standard output } } if ($::opt_filter) { debug "Filtering: will write standard output"; $OutputFilename = "-"; } else { debug "Output filename:", $OutputFilename; } push @GS, "-sOutputFile=$OutputFilename"; ### options compress, embed, res, autorotate push @GS, ('-dPDFSETTINGS=/prepress', '-dMaxSubsetPct=100', '-dSubsetFonts=true', '-dEmbedAllFonts=true') if $::opt_embed; push @GS, '-dUseFlateCompression=false' unless $::opt_compress; push @GS, "-r$::opt_res" if $::opt_res; $resmsg= $::opt_res ? $::opt_res : "[use gs default]"; push @GS, "-dAutoRotatePages=/$::opt_autorotate" if $::opt_autorotate; $rotmsg = $::opt_autorotate ? $::opt_autorotate : "[use gs default]"; # \label{val_autorotate} error "Invalid value for autorotate: '$::opt_autorotate' " . "(use 'All', 'None' or 'PageByPage')." if ($::opt_autorotate and not $::opt_autorotate =~ /^(None|All|PageByPage)\z/); ### option BoundingBox types my $BBName = "%%BoundingBox:"; !($::opt_hires and $::opt_exact) or error "Options --hires and --exact cannot be used together"; $BBName = "%%HiResBoundingBox:" if $::opt_hires; $BBName = "%%ExactBoundingBox:" if $::opt_exact; debug "BoundingBox comment:", $BBName; ### validate output file name in restricted mode \label{openout_any} use File::Spec::Functions qw(splitpath file_name_is_absolute); if ($restricted) { # use the equivalent of openout_any = p # (see opennameok() web2c/lib/texmfmp.c) # Well, for now, be even more paranoid: don't allow absolute path at all my $ok = 1; # disallow opening dot-files on Unix unless ($^O eq "MSWin32") { my ($drive, $path, $basename) = splitpath($OutputFilename); $ok = 0 if $basename =~ /^\./; } # disallow absolute path $ok = 0 if file_name_is_absolute($OutputFilename); # disallow colon on Windows. It could be used either after a drive # (like "a:dir\file") or for an alternate data stream (like # "file:ads"). if ($^O eq "MSWin32" || $^O eq "cygwin") { $ok = 0 if $OutputFilename =~ /:/; } # disallow going to parent directory my $ds = ($^O eq "MSWin32" || $^O eq "cygwin") ? qr([\\/]) : qr(/); $ok = 0 if $OutputFilename =~ /^\.\.$ds|$ds\.\.$ds/; # we passed all tests die error "Output filename '$OutputFilename' not allowed in restricted mode." unless $ok; } ### option gs if ($::opt_gs) { debug "Ghostscript command:", $GS; debug "Compression:", ($::opt_compress) ? "on" : "off"; debug "Embedding:", ($::opt_embed) ? "on" : "off"; debug "Rotation:", $rotmsg; debug "Resolution:", $resmsg; } ### emacs-page ### open input file if ($::opt_filter) { open(IN, '<-') || error("Cannot open stdin: $!"); } else { open(IN, '<', $InputFilename) || error("Cannot open $InputFilename: $!"); } binmode IN; ### open output file my $outname; # used in error message at end my $tmp_filename; # temporary file for windows my $OUT; # filehandle for output (GS pipe or temporary file) use File::Temp 'tempfile'; if ($::opt_gs) { unless ($^O eq 'MSWin32' || $^O eq 'cygwin') { # list piped open works push @GS, qw(- -c quit); debug "Ghostscript pipe:", join(' ', @GS); open($OUT, '|-', @GS) or error "Cannot open Ghostscript for piped input"; } else { # use a temporary file on Windows/Cygwin. ($OUT, $tmp_filename) = tempfile(UNLINK => 1); debug "Using temporary file '$tmp_filename'"; } $outname = $GS; } else { open($OUT, '>', $OutputFilename) or error "Cannot write \"$OutputFilename\""; $outname = $OutputFilename; } binmode $OUT; # reading a cr-eol file on a lf-eol system makes it impossible to parse # the header and besides it will read the intire file into yor line by line # scalar. this is also true the other way around. ### emacs-page ### scan a block, try to determine eol style my $buf; my $buflen; my @bufarray; my $inputpos; # We assume 2048 is big enough. my $EOLSCANBUFSIZE = 2048; $buflen = read(IN, $buf, $EOLSCANBUFSIZE); if ($buflen > 0) { my $crlfpos; my $lfpos; my $crpos; $inputpos = 0; # remove binary junk before header # if there is no header, we assume the file starts with ascii style and # we look for a eol style anyway, to prevent possible loading of the # entire file if ($buf =~ /%!/) { # throw away binary junk before %! $buf =~ s/(.*?)%!/%!/o; $inputpos = length($1); } $lfpos = index($buf, "\n"); $crpos = index($buf, "\r"); $crlfpos = index($buf, "\r\n"); if ($crpos > 0 and ($lfpos == -1 or $lfpos > $crpos+1)) { # The first eol was a cr and it was not immediately followed by a lf $/ = "\r"; debug "The first eol character was a CR ($crpos) and not immediately followed by a LF ($lfpos)"; } # Now we have set the correct eol-character. Get one more line and add # it to our buffer. This will make the buffer contain an entire line # at the end. Then split the buffer in an array. We will draw lines from # that array until it is empty, then move again back to $buf .= unless eof(IN); $buflen = length($buf); # Some extra magic is needed here: if we set $/ to \r, Perl's re engine # still thinks eol is \n in regular expressions (not very nice) so we # cannot split on ^, but have to split on a look-behind for \r. if ($/ eq "\r") { @bufarray = split(/(?<=\r)/ms, $buf); # split after \r } else { @bufarray = split(/^/ms, $buf); } } ### getline sub getline { if ($#bufarray >= 0) { $_ = shift(@bufarray); } else { $_ = ; } $inputpos += length($_) if defined $_; return defined($_); } ### scan first line my $header = 0; getline(); if (/%!/) { # throw away binary junk before %! s/(.*)%!/%!/o; } $header = 1 if /^%/; debug "Scanning header for BoundingBox"; print $OUT $_; ### variables and pattern for BoundingBox search my $bbxpatt = '[0-9eE\.\-]'; # protect backslashes: "\\" gets '\' my $BBValues = "\\s*($bbxpatt+)\\s+($bbxpatt+)\\s+($bbxpatt+)\\s+($bbxpatt+)"; my $BBCorrected = 0; sub CorrectBoundingBox { my ($llx, $lly, $urx, $ury) = @_; debug "Old BoundingBox:", $llx, $lly, $urx, $ury; my ($width, $height) = ($urx - $llx, $ury - $lly); my ($xoffset, $yoffset) = (-$llx, -$lly); debug "New BoundingBox: 0 0", $width, $height; debug "Offset:", $xoffset, $yoffset; print $OUT "%%BoundingBox: 0 0 $width $height$/"; print $OUT "<< /PageSize [$width $height] >> setpagedevice$/"; print $OUT "gsave $xoffset $yoffset translate$/"; } ### emacs-page ### scan header if ($header) { HEADER: while (getline()) { ### Fix for freehand bug ### by Peder Axensten next HEADER if(!/\S/); ### end of header if (!/^%/ or /^%%EndComments/) { print $OUT $_; last; } ### BoundingBox with values if (/^$BBName$BBValues/o) { CorrectBoundingBox $1, $2, $3, $4; $BBCorrected = 1; last; } ### BoundingBox with (atend) if (/^$BBName\s*\(atend\)/) { debug $BBName, "(atend)"; if ($::opt_filter) { warning "Cannot look for BoundingBox in the trailer", "with option --filter"; last; } my $pos = $inputpos; debug "Current file position:", $pos; # looking for %%BoundingBox while (getline()) { # skip over included documents my $nestDepth = 0; $nestDepth++ if /^%%BeginDocument/; $nestDepth-- if /^%%EndDocument/; if ($nestDepth == 0 && /^$BBName$BBValues/o) { CorrectBoundingBox $1, $2, $3, $4; $BBCorrected = 1; last; } } # go back seek(IN, $pos, 0) or error "Cannot go back to line \"$BBName (atend)\""; last; } # print header line print $OUT $_; } } ### print rest of file while (getline()) { print $OUT $_; } ### emacs-page ### close files close(IN); print $OUT "$/grestore$/" if $BBCorrected; close($OUT); ### actually run GS if we were writing to a temporary file if (defined $tmp_filename) { push @GS, $tmp_filename; push @GS, qw(-c quit); debug "Ghostscript command:", join(' ', @GS); system @GS; } # if ghostscript exited badly, we should too. if ($? & 127) { error(sprintf "Writing to $outname failed, signal %d\n", $? & 127); } elsif ($? != 0) { error(sprintf "Writing to $outname failed, error code %d\n", $? >> 8); } warning "BoundingBox not found" unless $BBCorrected; debug "Done.";