require_relative 'core_ext/string' autoload :FileUtils, 'fileutils' autoload :Open3, 'open3' autoload :Shellwords, 'shellwords' module Asciidoctor module Epub3 module GepubBuilderMixin DATA_DIR = ::File.expand_path(::File.join ::File.dirname(__FILE__), '..', '..', 'data') SAMPLES_DIR = ::File.join DATA_DIR, 'samples' WordJoinerRx = Epub3::WordJoinerRx FromHtmlSpecialCharsMap = ContentConverter::FromHtmlSpecialCharsMap FromHtmlSpecialCharsRx = ContentConverter::FromHtmlSpecialCharsRx CsvDelimiterRx = /\s*,\s*/ DefaultCoverImage = 'images/default-cover.png' InlineImageMacroRx = /^image:(.*?)\[(.*?)\]$/ def sanitized_doctitle doc, target = :plain return (doc.attr 'untitled-label') unless doc.header? title = case target when :attribute_cdata doc.doctitle(sanitize: true).gsub('"', '"') when :element_cdata doc.doctitle sanitize: true when :pcdata doc.doctitle when :plain doc.doctitle(sanitize: true).gsub(FromHtmlSpecialCharsRx, FromHtmlSpecialCharsMap) end title.gsub WordJoinerRx, '' end def add_theme_assets doc builder = self format = @format workdir = if doc.attr? 'epub3-stylesdir' stylesdir = doc.attr 'epub3-stylesdir' # FIXME make this work for Windows paths!! if stylesdir.start_with? '/' stylesdir else docdir = doc.attr 'docdir', '.' docdir = '.' if docdir.empty? ::File.join docdir, stylesdir end else ::File.join DATA_DIR, 'styles' end # TODO improve design/UX of custom theme functionality, including custom fonts resources do file 'styles/epub3.css' => (builder.postprocess_css_file ::File.join(workdir, 'epub3.css'), format) file 'styles/epub3-css3-only.css' => (builder.postprocess_css_file ::File.join(workdir, 'epub3-css3-only.css'), format) end resources do #file 'styles/epub3.css' => (builder.postprocess_css_file 'styles/epub3.css', format) #file 'styles/epub3-css3-only.css' => (builder.postprocess_css_file 'styles/epub3-css3-only.css', format) font_files, font_css = builder.select_fonts ::File.join(DATA_DIR, 'styles/epub3-fonts.css'), (doc.attr 'scripts', 'latin') file 'styles/epub3-fonts.css' => font_css with_media_type 'application/x-font-ttf' do font_files.each do |font_file| file font_file => ::File.join(DATA_DIR, font_file) end end end end def add_cover_image doc imagesdir = (doc.attr 'imagesdir', '.').chomp '/' imagesdir = (imagesdir == '.' ? nil : %(#{imagesdir}/)) if (front_cover_image = doc.attr 'front-cover-image') if front_cover_image =~ InlineImageMacroRx front_cover_image = %(#{imagesdir}#{$1}) end workdir = doc.attr 'docdir', '.' workdir = '.' if workdir.empty? else front_cover_image = DefaultCoverImage workdir = DATA_DIR end resources do cover_image %(#{imagesdir}jacket/cover#{::File.extname front_cover_image}) => ::File.join(workdir, front_cover_image) end end # NOTE must be called within the ordered block def add_cover_page doc, spine_builder, book imagesdir = (doc.attr 'imagesdir', '.').chomp '/' imagesdir = (imagesdir == '.' ? nil : %(#{imagesdir}/)) img = (doc.attr 'front-cover-image') || DefaultCoverImage if img =~ InlineImageMacroRx img = %(#{imagesdir}#{$1}) # TODO use proper attribute parser _, w, h = $2.split ',', 3 end w ||= 1050 h ||= 1600 img_path = %(#{imagesdir}jacket/cover#{::File.extname img}) # NOTE SVG wrapper maintains aspect ratio and confines image to view box content = %( #{sanitized_doctitle doc, :element_cdata} ).to_ios # GitDen expects a cover.xhtml, so add it to the spine spine_builder.file 'cover.xhtml' => content spine_builder.id 'cover' # clearly a deficiency of gepub that it does not match the id correctly book.spine.itemref_by_id['item_cover1'].idref = 'cover' end def add_images_from_front_matter if ::File.exist? 'front-matter.html' ::File.read('front-matter.html').scan(/ (builder.postprocess_xhtml_file 'front-matter.html', format) (spine_builder.instance_variable_get :@last_defined_item).properties << 'svg' end end # FIXME don't add same image more than once # FIXME add inline images def add_content_images doc, images docimagesdir = (doc.attr 'imagesdir', '.').chomp '/' docimagesdir = (docimagesdir == '.' ? nil : %(#{docimagesdir}/)) workdir = doc.attr 'docdir', '.' workdir = '.' if workdir.empty? resources workdir: workdir do images.each do |image| imagesdir = (image.document.attr 'imagesdir', '.').chomp '/' imagesdir = (imagesdir == '.' ? nil : %(#{imagesdir}/)) image_path = %(#{imagesdir}#{image.attr 'target'}) if image_path.start_with? %(#{docimagesdir}jacket/cover.) warn %(The image path #{image_path} is reserved for the cover artwork. Ignoring conflicting image from content.) elsif ::File.readable? image_path file image_path else warn %(Image not found or not readable: #{image_path}) end end end end def add_profile_images doc, usernames spine = @spine imagesdir = (doc.attr 'imagesdir', '.').chomp '/' imagesdir = (imagesdir == '.' ? nil : %(#{imagesdir}/)) resources do file %(#{imagesdir}avatars/default.jpg) => ::File.join(DATA_DIR, 'images/default-avatar.jpg') file %(#{imagesdir}headshots/default.jpg) => ::File.join(DATA_DIR, 'images/default-headshot.jpg') end workdir = doc.attr 'docdir', '.' workdir = '.' if workdir.empty? resources do usernames.each do |username| avatar = %(#{imagesdir}avatars/#{username}.jpg) if ::File.readable?(resolved_avatar = ::File.join(workdir, avatar)) file avatar => resolved_avatar else warn %(Avatar #{avatar} not found or readable. Falling back to default avatar for #{username}.) file avatar => ::File.join(DATA_DIR, 'images/default-avatar.jpg') end headshot = %(#{imagesdir}headshots/#{username}.jpg) if ::File.readable?(resolved_headshot = ::File.join(workdir, headshot)) file headshot => resolved_headshot elsif doc.attr? 'builder', 'editions' warn %(Headshot #{headshot} not found or readable. Falling back to default headshot for #{username}.) file headshot => ::File.join(DATA_DIR, 'images/default-headshot.jpg') end end =begin spine.each do |item| username = (item.attr 'username') || 'default' avatar_target = %(#{imagesdir}avatars/#{username}.jpg) if ::File.readable?(avatar = %(#{item.attr 'docname'}/avatar.jpg)) file avatar_target => avatar else warn %(Avatar #{avatar} not found or not readable. Falling back to default avatar for #{username}.) ::Dir.chdir DATA_DIR do file avatar_target => %(images/default-avatar.jpg) end end if ::File.readable? (headshot = %(#{item.attr 'docname'}/headshot.jpg)) file headshot # TODO default headshot? end end =end end end def add_content doc builder = self spine = @spine format = @format workdir = doc.attr 'docdir', '.' workdir = '.' if workdir.empty? resources workdir: workdir do builder.add_images_from_front_matter # QUESTION should we move navigation_document to the Packager class? seems to make sense #nav 'nav.xhtml' => (builder.postprocess_xhtml doc.converter.navigation_document(doc, spine), format) nav 'nav.xhtml' => (builder.postprocess_xhtml ::Asciidoctor::Converter::Factory.default.create('epub3-xhtml5').navigation_document(doc, spine), format) ordered do builder.add_cover_page doc, self, @book unless format == :kf8 builder.add_front_matter_page doc, self, builder, format spine.each_with_index do |item, i| content_path = %(#{item.id || (item.attr 'docname')}.xhtml) file content_path => (builder.postprocess_xhtml item.convert, format) # NOTE heading for ePub2 navigation file; toc.ncx requires headings to be plain text heading builder.sanitized_doctitle(item) @last_defined_item.properties << 'svg' if ((item.attr 'epub-properties') || []).include? 'svg' #linear 'yes' if i == 0 end end end end def collect_keywords doc, spine ([doc] + spine).map do |item| if item.attr? 'keywords' (item.attr 'keywords').split CsvDelimiterRx else [] end end.flatten.uniq end # Swap fonts in CSS based on the value of the document attribute 'scripts', # then return the list of fonts as well as the font CSS. def select_fonts filename, scripts = 'latin' font_css = ::File.read(filename) font_css = font_css.gsub(/(?<=-)latin(?=\.ttf\))/, scripts) unless scripts == 'latin' font_list = font_css.scan(/url\(\.\.\/(.+\.ttf)\);$/).flatten return [font_list, font_css.to_ios] end def postprocess_css_file filename, format return filename unless format == :kf8 postprocess_css ::File.read(filename), format end def postprocess_css content, format return content.to_ios unless format == :kf8 # TODO convert regular expressions to constants content .gsub(/^ -webkit-column-break-.*\n/, '') .gsub(/^ max-width: .*\n/, '') .to_ios end def postprocess_xhtml_file filename, format return filename unless format == :kf8 postprocess_xhtml ::File.read(filename), format end # NOTE Kindle requires that # # be converted to # def postprocess_xhtml content, format return content.to_ios unless format == :kf8 # TODO convert regular expressions to constants content .gsub(//, '') .gsub(/]+) style="width: (\d\d)%;"/, '.*?<\/script>\n?/m, '') .to_ios end end class Packager KINDLEGEN = ENV['KINDLEGEN'] || 'kindlegen' EPUBCHECK = ENV['EPUBCHECK'] || %(epubcheck#{::Gem.win_platform? ? '.bat' : '.sh'}) EpubExtensionRx = /\.epub$/ Kf8ExtensionRx = /-kf8\.epub$/ def initialize spine_doc, spine, format = :epub3, options = {} @document = spine_doc @spine = spine || [] @format = format end def package options = {} doc = @document spine = @spine fmt = @format dest = @dest_dir = options[:to_dir] || (File.expand_path ::Dir.pwd) images = spine.map {|item| (item.find_by context: :image) || [] }.flatten usernames = spine.map {|item| item.attr 'username' }.compact.uniq # FIXME authors should be aggregated already on parent document authors = if doc.attr? 'authors' (doc.attr 'authors').split(GepubBuilderMixin::CsvDelimiterRx).concat(spine.map {|item| item.attr 'author' }).uniq else [] end builder = ::GEPUB::Builder.new do extend GepubBuilderMixin @document = doc @spine = spine @format = fmt @book.epub_backward_compat = (fmt != :kf8) language(doc.attr 'lang', 'en') id 'pub-language' if doc.attr? 'uuid' unique_identifier doc.attr('uuid'), 'pub-identifier', 'uuid' else unique_identifier doc.id, 'pub-identifier', 'uuid' end # replace with next line once the attributes argument is supported #unique_identifier doc.id, 'pub-id', 'uuid', 'scheme' => 'xsd:string' title sanitized_doctitle(doc) id 'pub-title' # FIXME this logic needs some work if doc.attr? 'publisher' publisher(publisher_name = doc.attr('publisher')) # marc role: Book producer (see http://www.loc.gov/marc/relators/relaterm.html) creator doc.attr('producer', publisher_name), 'bkp' else # NOTE Use producer as both publisher and producer if publisher isn't specified if doc.attr? 'producer' producer_name = doc.attr 'producer' publisher producer_name # marc role: Book producer (see http://www.loc.gov/marc/relators/relaterm.html) creator producer_name, 'bkp' # NOTE Use author as creator if both publisher or producer are absent elsif doc.attr? 'author' # marc role: Author (see http://www.loc.gov/marc/relators/relaterm.html) creator doc.attr('author'), 'aut' end end if doc.attr? 'creator' # marc role: Creator (see http://www.loc.gov/marc/relators/relaterm.html) creator doc.attr('creator'), 'cre' else # marc role: Manufacturer (see http://www.loc.gov/marc/relators/relaterm.html) # QUESTION should this be bkp? creator 'Asciidoctor', 'mfr' end # TODO getting author list should be a method on Asciidoctor API contributors(*authors) if doc.attr? 'revdate' # TODO ensure this is a real date date(doc.attr 'revdate') else date ::Time.now.strftime('%Y-%m-%dT%H:%M:%SZ') end if doc.attr? 'description' description(doc.attr 'description') end (collect_keywords doc, spine).each do |s| subject s end if doc.attr? 'source' source(doc.attr 'source') end if doc.attr? 'copyright' rights(doc.attr 'copyright') end #add_metadata 'ibooks:specified-fonts', true add_theme_assets doc add_cover_image doc add_profile_images doc, usernames # QUESTION move add_content_images to add_content method? add_content_images doc, images add_content doc end ::FileUtils.mkdir_p dest unless ::File.directory? dest epub_file = ::File.expand_path %(#{doc.attr 'docname'}#{fmt == :kf8 ? '-kf8' : nil}.epub), dest builder.generate_epub epub_file puts %(Wrote #{fmt.upcase} to #{epub_file}) if options[:extract] extract_dir = epub_file.sub EpubExtensionRx, '' ::FileUtils.remove_dir extract_dir if ::File.directory? extract_dir ::Dir.mkdir extract_dir ::Dir.chdir extract_dir do ::Zip::File.open epub_file do |entries| entries.each do |entry| next unless entry.file? unless (entry_dir = ::File.dirname entry.name) == '.' || (::File.directory? entry_dir) ::FileUtils.mkdir_p entry_dir end entry.extract end end end puts %(Extracted #{fmt.upcase} to #{extract_dir}) end if fmt == :kf8 distill_epub_to_mobi epub_file elsif options[:validate] validate_epub epub_file end end # QUESTION how to enable the -c2 flag? (enables ~3-5% compression) def distill_epub_to_mobi epub_file kindlegen_cmd = KINDLEGEN unless ::File.executable? kindlegen_cmd require 'kindlegen' unless defined? ::Kindlegen kindlegen_cmd = ::Kindlegen.command end mobi_file = ::File.basename(epub_file).sub Kf8ExtensionRx, '.mobi' ::Open3.popen2e(::Shellwords.join [kindlegen_cmd, '-o', mobi_file, epub_file]) {|input, output, wait_thr| output.each {|line| puts line } } puts %(Wrote MOBI to #{::File.join ::File.dirname(epub_file), mobi_file}) end def validate_epub epub_file epubcheck_cmd = EPUBCHECK unless ::File.executable? epubcheck_cmd epubcheck_cmd = ::Gem.bin_path 'epubcheck', 'epubcheck' end # NOTE epubcheck gem doesn't support epubcheck command options; enable -quiet once supported ::Open3.popen2e(::Shellwords.join [epubcheck_cmd, epub_file]) {|input, output, wait_thr| output.each {|line| puts line } } end end end end