Sha256: c79440f70490cca467289d26ddd1a2f36f8bbd915d731bede99f8ccd6a71b8ec

Contents?: true

Size: 1.03 KB

Versions: 7

Compression:

Stored size: 1.03 KB

Contents

module Docsplit

  # Delegates to **pdftk** in order to create bursted single pages from
  # a PDF document.
  class PageExtractor

    # Burst a list of pdfs into single pages, as `pdfname_pagenumber.pdf`.
    def extract(pdfs, opts)
      extract_options opts
      [pdfs].flatten.each do |pdf|
        pdf_name = File.basename(pdf, File.extname(pdf))
        page_path = ESCAPE[File.join(@output, "#{pdf_name}")] + "_%d.pdf"
        FileUtils.mkdir_p @output unless File.exists?(@output)
        
        cmd = if DEPENDENCIES[:pdftailor] # prefer pdftailor, but keep pdftk for backwards compatability
          "pdftailor unstitch --output #{page_path} #{ESCAPE[pdf]} 2>&1"
        else
          "pdftk #{ESCAPE[pdf]} burst output #{page_path} 2>&1"
        end
        result = `#{cmd}`.chomp
        FileUtils.rm('doc_data.txt') if File.exists?('doc_data.txt')
        raise ExtractionFailed, result if $? != 0
        result
      end
    end


    private

    def extract_options(options)
      @output = options[:output] || '.'
    end

  end

end

Version data entries

7 entries across 7 versions & 4 rubygems

Version Path
docsplit-ng-0.8.0 lib/docsplit/page_extractor.rb
luccasmaso-docsplit-0.7.4.2 lib/docsplit/page_extractor.rb
burisu-docsplit-0.7.8 lib/docsplit/page_extractor.rb
docsplit-0.8.0.alpha1 lib/docsplit/page_extractor.rb
docsplit-0.8.0.alpha lib/docsplit/page_extractor.rb
docsplit-0.7.6 lib/docsplit/page_extractor.rb
burisu-docsplit-0.7.7 lib/docsplit/page_extractor.rb