#!/usr/bin/env ruby
# == Name
#
# pdfmult - put multiple copies of a PDF page on one page
#
# == Description
#
# +pdfmult+ rearranges multiple copies of a PDF page (shrunken) on one page.
#
# == See also
#
# Use pdfmult --help to display a brief help message.
#
# The full documentation for +pdfmult+ is available on the
# project home page.
#
# == Author
#
# Copyright (C) 2011-2013 Marcus Stollsteimer
#
# License GPLv3+: GNU GPL version 3 or later

require 'optparse'
require 'tempfile'
require 'tmpdir'
require 'open3'
require 'erb'
require 'shellwords'

# This module contains the classes for the +pdfmult+ tool.
module Pdfmult

  PROGNAME  = 'pdfmult'
  VERSION   = '1.3.1'
  DATE      = '2013-01-04'
  HOMEPAGE  = 'https://github.com/stomar/pdfmult/'
  TAGLINE   = 'puts multiple copies of a PDF page on one page'

  COPYRIGHT = "Copyright (C) 2011-2013 Marcus Stollsteimer.\n" +
              "License GPLv3+: GNU GPL version 3 or later .\n" +
              "This is free software: you are free to change and redistribute it.\n" +
              "There is NO WARRANTY, to the extent permitted by law."

  PDFLATEX  = '/usr/bin/pdflatex'
  KPSEWHICH = '/usr/bin/kpsewhich'

  # Parser for the command line options.
  # The class method parse! does the job.
  class Optionparser

    # Parses the command line options from +argv+.
    # (+argv+ is cleared).
    # Might print out help or version information.
    #
    # +argv+ - array with the command line options
    #
    # Returns a hash containing the option parameters
    # (keys: :force, :infile, :latex, :number, :outfile, :silent, :pages).
    #
    # Raises ArgumentError unless exactly one non-empty file argument
    # is left after option parsing; OptionParser errors are passed through.
    def self.parse!(argv)

      options = {
        :force   => false,
        :infile  => nil,
        :latex   => false,
        :number  => 2,
        :outfile => nil,
        :silent  => false,
        :pages   => nil
      }

      opt_parser = OptionParser.new do |opt|
        opt.banner = "Usage: #{PROGNAME} [options] file"
        opt.separator ''
        opt.separator 'pdfmult is a command line tool that'
        opt.separator 'rearranges multiple copies of a PDF page (shrunken) on one page.'
        opt.separator ''
        opt.separator 'The paper size of the produced PDF file is A4,'
        opt.separator 'the input file is also assumed to be in A4 format.'
        opt.separator 'The input PDF file may consist of several pages.'
        opt.separator 'If pdfmult succeeds in obtaining the page count it will rearrange all pages,'
        opt.separator 'if not, only the first page is processed'
        opt.separator '(unless the page count was specified via command line option).'
        opt.separator ''
        opt.separator 'pdfmult uses pdflatex with the pdfpages package,'
        opt.separator 'so both have to be installed on the system.'
        opt.separator 'If the --latex option is used, though, pdflatex is not run'
        opt.separator 'and a LaTeX file is created instead of a PDF.'
        opt.separator ''
        opt.separator 'Options'
        opt.separator ''

        # process --version and --help first,
        # exit successfully (GNU Coding Standards)
        opt.on_tail('-h', '--help', 'Print a brief help message and exit.') do
          puts opt_parser
          puts "\nReport bugs on the #{PROGNAME} home page: <#{HOMEPAGE}>"
          exit
        end

        opt.on_tail('-v', '--version',
                    'Print a brief version information and exit.') do
          puts "#{PROGNAME} #{VERSION}"
          puts COPYRIGHT
          exit
        end

        opt.on('-n', '--number NUMBER', ['2', '4', '8', '9', '16'], Integer,
               'Number of copies to put on one page: 2 (default), 4, 8, 9, 16.') do |n|
          options[:number] = n
        end

        opt.on('-f', '--[no-]force', 'Do not prompt before overwriting.') do |f|
          options[:force] = f
        end

        opt.on('-l', '--latex', 'Create a LaTeX file instead of a PDF file (default: file_2.tex).') do
          options[:latex] = true
        end

        opt.on('-o', '--output FILE', String,
               'Output file (default: file_2.pdf). Use - to output to stdout.') do |f|
          options[:outfile] = f
        end

        opt.on('-p', '--pages NUMBER', Integer,
               'Number of pages to convert.',
               "If given, #{PROGNAME} does not try to obtain the page count from the source PDF.") do |count|
          raise(OptionParser::InvalidArgument, count) unless count > 0
          options[:pages] = count
        end

        opt.on('-s', '--[no-]silent', 'Do not output progress information.') do |s|
          options[:silent] = s
        end

        opt.separator ''
      end
      opt_parser.parse!(argv)

      # only input file should be left in argv
      raise(ArgumentError, 'wrong number of arguments') if argv.size != 1 || argv[0].empty?

      options[:infile] = argv.pop

      # set output file unless set by option;
      # only a literal, trailing ".pdf" extension is stripped from the input name
      ext = options[:latex] ? 'tex' : 'pdf'
      infile_without_ext = options[:infile].sub(/\.pdf\z/, '')
      options[:outfile] ||= "#{infile_without_ext}_#{options[:number]}.#{ext}"

      options
    end
  end

  # Class for the page layout.
  #
  # Create an instance with Layout.new, specifying
  # the number of pages to put on one page.
  # Layout#geometry returns the geometry string
  # (+nil+ for a number that has no entry in GEOMETRY).
  class Layout

    attr_reader :pages, :geometry

    GEOMETRY = {
      2  => '2x1',
      4  => '2x2',
      8  => '4x2',
      9  => '3x3',
      16 => '4x4'
    }.freeze

    # Geometries that are laid out on a landscape page.
    LANDSCAPE_GEOMETRIES = ['2x1', '4x2'].freeze

    # +pages+ - number of copies to put on one page
    def initialize(pages)
      @pages = pages
      @geometry = GEOMETRY[pages]
    end

    # Returns true if the layout needs a landscape page.
    def landscape?
      LANDSCAPE_GEOMETRIES.include?(geometry)
    end
  end

  # Class for the LaTeX document.
  #
  # Create an instance with LaTeXDocument.new, specifying
  # the input file, the number of pages to put on one page,
  # and the page count of the input file.
  #
  # The method +to_s+ returns the document as multiline string.
  class LaTeXDocument

    # ERB template; lines starting with % are Ruby code (trim mode '%<>').
    TEMPLATE = %q(
      \documentclass[<%= class_options %>]{article}
      \usepackage{pdfpages}
      \pagestyle{empty}
      \setlength{\parindent}{0pt}
      \begin{document}
      % pages_strings.each do |pages|
        \includepdf[pages={<%= pages %>},nup=<%= geometry %>]{<%= @pdffile %>}%
      % end
      \end{document}
    ).gsub(/\A\n/,'').gsub(/^ +/, '')

    # Initializes a LaTeXDocument instance.
    # Expects an argument hash with:
    #
    # +:pdffile+    - filename of input pdf file
    # +:layout+     - page layout
    # +:page_count+ - page count of the input file
    def initialize(args)
      @pdffile    = args[:pdffile]
      @layout     = args[:layout]
      @page_count = args[:page_count]
    end

    # Returns the LaTeX document as multiline string.
    def to_s
      erb_template.result(binding)
    end

    private

    # Returns the ERB object for TEMPLATE.
    # The keyword form is used where ERB.new accepts keywords (the positional
    # form is deprecated there); older ERB versions get the positional form.
    def erb_template
      if ERB.instance_method(:initialize).parameters.assoc(:key)
        ERB.new(TEMPLATE, :trim_mode => '%<>')
      else
        ERB.new(TEMPLATE, 0, '%<>')
      end
    end

    # Returns the options for the document class.
    def class_options
      @layout.landscape? ? 'a4paper,landscape' : 'a4paper'
    end

    # Returns the geometry string of the layout.
    def geometry
      @layout.geometry
    end

    # Returns an array of pages strings.
    # For 4 copies and 2 pages: ["1,1,1,1", "2,2,2,2"].
    def pages_strings
      (1..@page_count).map {|page| ([page] * @layout.pages).join(',') }
    end
  end

  # A class for PDF meta data (up to now only used for the page count).
  #
  # Create an instance with PDFInfo.new, specifying the file name.
  # +PDFInfo+ tries to use the +pdfinfo+ system tool to obtain meta data.
  # If successful, the attribute +page_count+ contains the page count,
  # else the attribute is set to +nil+.
  class PDFInfo

    PDFINFOCMD = '/usr/bin/pdfinfo'

    # Returns the page count of the input file, or nil.
    attr_reader :page_count

    # Returns true if default +pdfinfo+ system tool is available (for unit tests).
    def self.infocmd_available?
      Application.command_available?("#{PDFINFOCMD} -v")
    end

    # This is the initialization method for the class.
    #
    # +file+    - file name of the PDF file
    # +options+ - hash; +:pdfinfocmd+ overrides the info command (for unit tests)
    def initialize(file, options={})
      @file = file
      @binary = options[:pdfinfocmd] || PDFINFOCMD  # for unit tests
      @infos = retrieve_infos
      @page_count = @infos['Pages'] && @infos['Pages'].to_i
    end

    private

    # Tries to retrieve the PDF infos for the file; returns an info hash
    # (empty if the command fails).
    def retrieve_infos
      # the file name is escaped so that blanks and shell metacharacters
      # in it reach the info command as one literal argument
      command = "#{@binary} #{Shellwords.escape(@file)}"
      return {} unless Application.command_available?(command)

      pairs = `#{command}`.split(/\n/).map {|line| line.split(/\s*:\s*/, 2) }

      # lines without a colon do not form a key/value pair and are skipped
      Hash[pairs.select {|pair| pair.size == 2 }]
    end
  end

  # The main program. It's run! method is called
  # if the script is run from the command line.
  # It parses the command line arguments and does the job.
  class Application

    ERRORCODE = {:general => 1, :usage => 2}.freeze

    # The main program.
    #
    # Reads the options from ARGV, builds the LaTeX document, and writes
    # either the LaTeX source or the PDF created by pdflatex to the output
    # file (or to stdout).
    def self.run!

      # parse options
      begin
        options = Optionparser.parse!(ARGV)
      rescue => e
        usage_fail(e.message)
      end

      infile = options[:infile]
      outfile = options[:outfile]
      use_stdout = (outfile == '-')
      silent = options[:silent]

      # test for pdflatex installation
      unless options[:latex]
        message = 'seems not to be installed (you might try using the -l option)'
        general_fail("`#{PDFLATEX}' #{message}")  unless command_available?("#{PDFLATEX} --version")
        general_fail("`pdfpages.sty' #{message}")  unless command_available?("#{KPSEWHICH} pdfpages.sty")
      end

      # test input file
      usage_fail("no such file: `#{infile}'")  unless File.exist?(infile)
      usage_fail("specified input not of the type `file'")  unless File.ftype(infile) == 'file'

      # test for existing output file
      if !use_stdout && !options[:force] && File.exist?(outfile)
        overwrite_ok = ask("File `#{outfile}' already exists. Overwrite?")
        exit  unless overwrite_ok
      end

      # set page number (get PDF info if necessary)
      pages = options[:pages] || PDFInfo.new(infile).page_count || 1

      # create LaTeX document
      args = {
        :pdffile    => infile,
        :layout     => Layout.new(options[:number]),
        :page_count => pages
      }
      document = LaTeXDocument.new(args)

      output = options[:latex] ? document.to_s : create_pdf(document, silent)

      # redirect stdout to output file
      $stdout.reopen(outfile, 'w')  unless use_stdout

      warn "Writing on #{outfile}."  unless (use_stdout || silent)
      puts output
    end

    # Runs pdflatex on the document in a temporary directory.
    #
    # +document+ - the LaTeX document (its +to_s+ is written to the tex file)
    # +silent+   - if true, the pdflatex progress messages are not printed
    #
    # Returns the content of the created PDF file;
    # exits with an error message if no PDF file was created.
    def self.create_pdf(document, silent) # :nodoc:
      Dir.mktmpdir('pdfmult') do |dir|
        texfile = 'pdfmult.tex'
        pdffile = File.join(dir, 'pdfmult.pdf')
        File.open(File.join(dir, texfile), 'w') {|f| f.write(document.to_s) }

        # argument list instead of a command string: no shell is involved
        Open3.popen3(PDFLATEX, '-output-directory', dir, texfile) do |stdin, stdout, stderr|
          stdin.close  # pdflatex must not wait for input when it hits an error
          # stdout is always drained (a full pipe would block pdflatex);
          # the progress messages are redirected to stderr unless silent
          stdout.each_line {|line| warn line.chomp  unless silent }
          stderr.read  # make sure all streams are read (and command has finished)
        end

        general_fail("`#{PDFLATEX}' did not create a PDF file")  unless File.exist?(pdffile)

        File.binread(pdffile)
      end
    end

    # Asks for yes or no (y/n).
    #
    # +question+ - string to be printed
    #
    # Returns +true+ if the answer is yes,
    # +false+ if the answer is no or if the input has ended.
    def self.ask(question) # :nodoc:
      loop do
        $stderr.print "#{question} [y/n] "
        reply = $stdin.gets  # $stdin: avoids gets / ARGV problem
        return false  if reply.nil?  # end of input: nobody left to confirm

        case reply.chomp.downcase
        when 'y' then return true
        when 'n' then return false
        end

        warn "Please answer `y' or `n'."
      end
    end

    # Prints an error message and exits.
    def self.general_fail(message) # :nodoc:
      warn "#{PROGNAME}: #{message}"
      exit ERRORCODE[:general]
    end

    # Prints an error message and a short help information, then exits.
    def self.usage_fail(message) # :nodoc:
      warn "#{PROGNAME}: #{message}"
      warn "Use `#{PROGNAME} --help' for valid options."
      exit ERRORCODE[:usage]
    end

    # Tests silently whether the given system command is available.
    #
    # +command+ - command to test
    #
    # Returns true if the command could be run and exited successfully.
    def self.command_available?(command) # :nodoc:
      !!system("#{command} >/dev/null 2>&1")
    end
  end

  ### call main method only if called on command line

  if __FILE__ == $0
    Application.run!
  end

end  # module