require "fileutils"
require "nokogiri"
require "htmlentities"
require "yaml"
require "fontist"
require "fontist/manifest/install"
require_relative "compile_validate"
require_relative "fontist_utils"

module Metanorma
  # Compiles an input document (AsciiDoc or Metanorma XML, chosen by file
  # extension) into the output formats offered by the processor that the
  # registry returns for the document type.
  class Compile
    # @return [Array]
    attr_reader :errors, :processor

    def initialize
      @registry = Metanorma::Registry.instance
      @errors = []
    end

    # Entry point: resolves options, reads the input, runs the optional
    # Relaton/extract exports and font installation, then generates every
    # requested output format.
    #
    # @param filename [String] path of the input document
    # @param options [Hash] compilation options; mutated and enriched in place
    # @return [Array, nil] the extensions in the order they were processed,
    #   or nil when the input file extension is not supported
    def compile(filename, options = {})
      require_libraries(options)
      options = options_extract(filename, options)
      validate_options(options)
      @processor = @registry.find_processor(options[:type].to_sym)

      extensions = get_extensions(options)
      return nil unless extensions

      input = process_input(filename, options)
      return nil unless input

      file, isodoc = input
      relaton_export(isodoc, options)
      extract(isodoc, options[:extract], options[:extract_type])
      FontistUtils.install_fonts(@processor, options)
      process_extensions(extensions, file, isodoc, options)
    end

    # Requires every library named under options[:require], if any.
    #
    # @param options [Hash, nil]
    def require_libraries(options)
      options&.dig(:require)&.each { |r| require r }
    end

    # Derives the document type from the XML root element name, using the
    # registry's root tag table.
    #
    # @param file [String] document content
    # @return [Hash] `{ type: key }` for the first registered root tag equal
    #   to the root element name, otherwise an empty hash
    def xml_options_extract(file)
      root = Nokogiri::XML(file).root
      return {} unless root

      @registry.root_tags.each do |type, tag|
        return { type: type } if tag == root.name
      end
      {}
    end

    # Merges options declared inside the document into the caller's options.
    # Values already present in +options+ take precedence (`||=`).
    #
    # @param filename [String] path of the input document
    # @param options [Hash] caller-supplied options; mutated in place
    # @return [Hash] the same +options+ hash
    def options_extract(filename, options)
      content = read_file(filename)
      o = Metanorma::Input::Asciidoc.new.extract_metanorma_options(content)
      o = o.merge(xml_options_extract(content))

      options[:type] ||= o[:type]&.to_sym
      aliased = @registry.alias(options[:type])
      options[:type] = aliased if aliased

      # File.dirname yields "." for a bare filename; the previous regex
      # substitution left the filename itself in place when it contained no
      # "/", producing paths such as "doc.adoc/relaton.xml".
      dir = File.dirname(filename)
      options[:relaton] ||= File.join(dir, o[:relaton]) if o[:relaton]
      options[:sourcecode] ||= File.join(dir, o[:sourcecode]) if o[:sourcecode]

      options[:extension_keys] ||= o[:extensions]&.split(/,[ ]*/)&.map(&:to_sym)
      # [:all] is reset to nil so that get_extensions falls back to every
      # format the processor declares.
      options[:extension_keys] = nil if options[:extension_keys] == [:all]
      options[:format] ||= :asciidoc
      options[:filename] = filename
      options
    end

    # Works out which output formats to generate. Requested formats missing
    # from the processor's output_formats are logged and recorded in @errors;
    # :presentation is appended when any retained format asks for
    # Presentation XML and it is not already listed.
    #
    # @param options [Hash] options[:extension_keys] defaults to all of the
    #   processor's output format keys
    # @return [Array<Symbol>] supported extensions
    def get_extensions(options)
      options[:extension_keys] ||= @processor.output_formats.keys

      extensions = options[:extension_keys].select do |e|
        if @processor.output_formats[e]
          true
        else
          message = "[metanorma] Error: #{e} format is not supported for this standard."
          @errors << message
          Util.log(message, :error)
          false
        end
      end

      needs_presentation =
        extensions.any? { |e| @processor.use_presentation_xml(e) }
      if needs_presentation && !extensions.include?(:presentation)
        extensions << :presentation
      end
      extensions
    end

    # Reads the input file and produces the Metanorma XML for it.
    #
    # @param filename [String] path of the input document
    # @param options [Hash]
    # @return [Array(String, Object), nil] the source text and the value
    #   later used as the Metanorma XML (the processor's input_to_isodoc
    #   result for AsciiDoc, the file content for XML), or nil for an
    #   unsupported file extension
    def process_input(filename, options)
      case extname = File.extname(filename)
      when ".adoc"
        Util.log("[metanorma] Processing: AsciiDoc input.", :info)
        file = read_file(filename)
        # Insert the :mn-keep-asciimath: attribute right after the first
        # line that starts with "=".
        options[:asciimath] and
          file.sub!(/^(=[^\n]+\n)/, "\\1:mn-keep-asciimath:\n")
        # Prefix include targets with the document's directory.
        dir = File.dirname(filename)
        dir != "." and file.gsub!(/^include::/, "include::#{dir}/")
        [file, @processor.input_to_isodoc(file, filename, options)]
      when ".xml"
        Util.log("[metanorma] Processing: Metanorma XML input.", :info)
        # TODO NN: this is a hack -- we should provide/bridge the
        # document attributes in Metanorma XML
        ["", read_file(filename)]
      else
        Util.log("[metanorma] Error: file extension #{extname} is not supported.", :error)
        nil
      end
    end

    # Reads a file as UTF-8 and converts CRLF line endings to LF.
    #
    # @param filename [String]
    # @return [String]
    def read_file(filename)
      File.read(filename, encoding: "utf-8").gsub("\r\n", "\n")
    end

    # Writes the document's bibdata element to options[:relaton].
    # Does nothing when no Relaton path is configured; logs and skips the
    # export when the document has no bibdata element.
    #
    # @param isodoc [String] Metanorma XML
    # @param options [Hash]
    def relaton_export(isodoc, options)
      return unless options[:relaton]

      xml = Nokogiri::XML(isodoc)
      bibdata = xml.at("//bibdata") || xml.at("//xmlns:bibdata")
      # Previously a missing bibdata element raised NoMethodError on nil.
      unless bibdata
        Util.log("[metanorma] Error: no bibdata element found; " \
                 "Relaton export skipped.", :error)
        return
      end

      # docid = bibdata&.at("./xmlns:docidentifier")&.text || options[:filename]
      # outname = docid.sub(/^\s+/, "").sub(/\s+$/, "").gsub(/\s+/, "-") + ".xml"
      File.open(options[:relaton], "w:UTF-8") { |f| f.write bibdata.to_xml }
    end

    # Converts a sourcecode node to plain text: callout and annotation
    # elements are removed, br elements become newlines, and HTML entities
    # are decoded. The node passed in is modified.
    #
    # @param xml [Nokogiri::XML::Node]
    # @return [String]
    def clean_sourcecode(xml)
      xml.xpath(".//callout | .//annotation | .//xmlns:callout | " \
                ".//xmlns:annotation").each(&:remove)
      xml.xpath(".//br | .//xmlns:br").each { |x| x.replace("\n") }
      HTMLEntities.new.decode(xml.children.to_xml)
    end

    # Exports embedded assets of the document into +dirname+.
    # NOTE: +dirname+ is deleted recursively and recreated first.
    #
    # @param isodoc [String] Metanorma XML
    # @param dirname [String, nil] target directory; nil disables extraction
    # @param extract_types [Array<Symbol>, nil] any of :sourcecode, :image,
    #   :requirement; nil or empty selects all three
    def extract(isodoc, dirname, extract_types)
      return unless dirname

      if extract_types.nil? || extract_types.empty?
        extract_types = %i[sourcecode image requirement]
      end
      FileUtils.rm_rf dirname
      FileUtils.mkdir_p dirname
      xml = Nokogiri::XML(isodoc)
      sourcecode_export(xml, dirname) if extract_types.include? :sourcecode
      image_export(xml, dirname) if extract_types.include? :image
      requirement_export(xml, dirname) if extract_types.include? :requirement
    end

    # Writes each sourcecode element to "<dirname>/sourcecode/", named by
    # its filename attribute or "sourcecode-NNNN.txt".
    #
    # @param xml [Nokogiri::XML::Document]
    # @param dirname [String]
    def sourcecode_export(xml, dirname)
      xml.at("//sourcecode | //xmlns:sourcecode") or return
      FileUtils.mkdir_p "#{dirname}/sourcecode"
      xml.xpath("//sourcecode | //xmlns:sourcecode").each_with_index do |s, i|
        filename = s["filename"] || sprintf("sourcecode-%04d.txt", i)
        File.open("#{dirname}/sourcecode/#{filename}", "w:UTF-8") do |f|
          # Clean a copy so the document tree itself is left untouched.
          f.write clean_sourcecode(s.dup)
        end
      end
    end

    # Decodes each base64 "data:image/..." image to "<dirname>/image/",
    # named by its filename attribute or "image-NNNN.<type>". Images whose
    # src is not a base64 data URI are skipped.
    #
    # @param xml [Nokogiri::XML::Document]
    # @param dirname [String]
    def image_export(xml, dirname)
      xml.at("//image | //xmlns:image") or return
      FileUtils.mkdir_p "#{dirname}/image"
      xml.xpath("//image | //xmlns:image").each_with_index do |s, i|
        # The named groups were missing from the pattern, which made it an
        # invalid regexp and left imgtype/imgdata undefined.
        m = %r{^data:image/(?<imgtype>[^;]+);base64,(?<imgdata>.+)$}
          .match(s["src"])
        next unless m

        filename = s["filename"] || sprintf("image-%04d.%s", i, m[:imgtype])
        File.open("#{dirname}/image/#{filename}", "wb") do |f|
          # "m0" is strict base64 decoding (what Base64.strict_decode64
          # does), without depending on the base64 library being loaded.
          f.write(m[:imgdata].unpack1("m0"))
        end
      end
    end

    REQUIREMENT_XPATH = "//requirement | //xmlns:requirement | "\
                        "//recommendation | //xmlns:recommendation | //permission | "\
                        "//xmlns:permission".freeze

    # Writes each requirement, recommendation and permission element to
    # "<dirname>/requirement/", named by its filename attribute or
    # "<element name>-NNNN.xml".
    #
    # @param xml [Nokogiri::XML::Document]
    # @param dirname [String]
    def requirement_export(xml, dirname)
      xml.at(REQUIREMENT_XPATH) or return
      FileUtils.mkdir_p "#{dirname}/requirement"
      xml.xpath(REQUIREMENT_XPATH).each_with_index do |s, i|
        filename = s["filename"] || sprintf("%s-%04d.xml", s.name, i)
        File.open("#{dirname}/requirement/#{filename}", "w:UTF-8") do |f|
          f.write s
        end
      end
    end

    # dependency ordering
    #
    # @param ext [Symbol] output format key
    # @return [Integer] sort rank: :xml, :rxl and :presentation come first,
    #   in that order; every other format shares rank 99
    def sort_extensions_execution(ext)
      case ext
      when :xml then 0
      when :rxl then 1
      when :presentation then 2
      else 99
      end
    end

    # When options[:wrapper] is set and the format's file extension ends in
    # "html", moves "<name>.html" and "<name>_images" into a directory named
    # after the output file without its ".html" suffix.
    #
    # @param options [Hash]
    # @param file_extension [String]
    # @param outfilename [String]
    def wrap_html(options, file_extension, outfilename)
      return unless options[:wrapper] && /html$/.match(file_extension)

      outfilename = outfilename.sub(/\.html$/, "")
      FileUtils.mkdir_p outfilename
      FileUtils.mv "#{outfilename}.html", outfilename
      FileUtils.mv "#{outfilename}_images", outfilename, force: true
    end

    # Generates each requested output format, in dependency order.
    # isodoc is Raw Metanorma XML
    #
    # @param extensions [Array<Symbol>] output format keys
    # @param file [String] source text handed to the processor's
    #   extract_options ("" for XML input)
    # @param isodoc [String] Metanorma XML
    # @param options [Hash]
    # @return [Array<Symbol>] the extensions in processing order
    def process_extensions(extensions, file, isodoc, options)
      f = change_output_dir options
      xml_name = f.sub(/\.[^.]+$/, ".xml")
      presentationxml_name = f.sub(/\.[^.]+$/, ".presentation.xml")

      ordered = extensions.sort do |a, b|
        sort_extensions_execution(a) <=> sort_extensions_execution(b)
      end

      ordered.each do |ext|
        isodoc_options = @processor.extract_options(file)
        isodoc_options[:datauriimage] = true if options[:datauriimage]
        isodoc_options[:sourcefilename] = options[:filename]
        file_extension = @processor.output_formats[ext]
        outfilename = f.sub(/\.[^.]+$/, ".#{file_extension}")

        if ext == :pdf
          font_locations =
            FontistUtils.fontist_font_locations(@processor, options)
          font_locations and
            isodoc_options[:mn2pdf] =
              { font_manifest_file: font_locations.path }
        end

        if ext == :rxl
          # The Relaton output reuses the bibdata export, pointed at this
          # format's output file.
          options[:relaton] = outfilename
          relaton_export(isodoc, options)
        else
          begin
            if @processor.use_presentation_xml(ext)
              # No XML content is passed here; the processor is given the
              # Presentation XML file name instead.
              @processor.output(nil, presentationxml_name, outfilename, ext,
                                isodoc_options)
            else
              @processor.output(isodoc, xml_name, outfilename, ext,
                                isodoc_options)
            end
          rescue StandardError => e
            # Errors flagged "Fatal:" are collected in @errors; anything
            # else is printed and the remaining formats still run.
            if e.message.include? "Fatal:"
              @errors << e.message
            else
              puts e.message
              puts e.backtrace.join("\n")
            end
          end
        end
        wrap_html(options, file_extension, outfilename)
      end
    end

    private

    # @param options [Hash]
    # @return [String]
    def change_output_dir(options)
      if options[:output_dir]
        File.join options[:output_dir], File.basename(options[:filename])
      else
        options[:filename]
      end
    end
  end
end