require "date"
require "nokogiri"
require "htmlentities"
require "json"
require "pathname"
require "open-uri"
module Asciidoctor
module ISO
class Converter < Standoc::Converter
# XPath for the footnotes handled in the first renumbering pass:
# footnotes in the preface and in the scope clause.
PRE_NORMREF_FOOTNOTES = [
  "//preface//fn",
  "//clause[@type = 'scope']//fn",
].join(" | ").freeze

# XPath for the footnotes inside the normative references.
NORMREF_FOOTNOTES = "//references[@normative = 'true']//fn".freeze

# XPath for the footnotes handled in the last renumbering pass:
# non-scope clauses under sections, annexes, and non-normative references.
POST_NORMREF_FOOTNOTES = [
  "//sections//clause[not(@type = 'scope')]//fn",
  "//annex//fn",
  "//references[@normative = 'false']//fn",
].join(" | ").freeze
# Walks the document's footnotes in three passes (before, inside, and
# after the normative references) and hands each one to
# other_footnote_renumber1 (defined outside this section), threading a
# running counter and a `seen` hash through every call so the state
# carries across the three passes.
#
# Returns whatever the final pass's `each` returns (the set of
# footnotes matched by POST_NORMREF_FOOTNOTES).
def other_footnote_renumber(xmldoc)
  counter = 0
  seen = {}
  passes = [PRE_NORMREF_FOOTNOTES, NORMREF_FOOTNOTES, POST_NORMREF_FOOTNOTES]
  # Each XPath is evaluated only when its pass starts, after the
  # previous pass has finished processing.
  passes.map do |path|
    xmldoc.xpath(path).each do |fn|
      counter, seen = other_footnote_renumber1(fn, counter, seen)
    end
  end.last
end
# Builds the prefixed identifier string for the node `id`.
#
# prefix - array of publisher prefixes, joined with "/".
# id     - node responding to `text`.
#
# When @amd is set the identifier text is returned untouched, because
# the prefixes are simply inherited from the parent document.
# Otherwise the joined prefix is placed in front of the text, separated
# by a space unless a line of the text already starts with "/".
def id_prefix(prefix, id)
  text = id.text
  return text if @amd

  separator = text.match(%r{^/}) ? "" : " "
  "#{prefix.join('/')}#{separator}#{text}"
end
# Collects the publisher prefixes declared in the document's bibdata.
#
# Each publisher organization contributes its abbreviation, or its name
# when there is no abbreviation (nil when it has neither). "ISO" is
# always moved to the front of the list; every other value is appended
# in document order.
#
# Returns the array of prefixes.
def get_id_prefix(xmldoc)
  publishers = xmldoc.xpath("//bibdata/contributor[role/@type = 'publisher']" \
                            "/organization")
  publishers.each_with_object([]) do |org, prefix|
    label = org.at("abbreviation")&.text || org.at("name")&.text
    if label == "ISO"
      prefix.unshift("ISO")
    else
      prefix << label
    end
  end
end
# Identifiers are prefixed with the publisher abbreviations; ISO as a prefix goes first
# Rewrites the document identifiers in bibdata so that they carry the
# publisher prefix computed by get_id_prefix.
#
# Nothing is changed when the document has no docidentifier of type
# 'ISO'. Otherwise that identifier is rewritten first, followed by
# whichever of the project number, 'iso-with-lang' and 'iso-reference'
# identifiers are present.
def docidentifier_cleanup(xmldoc)
  prefix = get_id_prefix(xmldoc)
  iso_id = xmldoc.at("//bibdata/docidentifier[@type = 'ISO']")
  return unless iso_id

  iso_id.content = id_prefix(prefix, iso_id)
  optional_ids = [
    "//bibdata/ext/structuredidentifier/project-number",
    "//bibdata/docidentifier[@type = 'iso-with-lang']",
    "//bibdata/docidentifier[@type = 'iso-reference']",
  ]
  # Each optional identifier is looked up and rewritten in turn; the
  # value of the last step is the method's result.
  optional_ids.map do |path|
    node = xmldoc.at(path)
    node && (node.content = id_prefix(prefix, node))
  end.last
end
# Strips the first " (All Parts)" marker (matched case-insensitively)
# from the reference text, then delegates to the parent implementation
# with the cleaned text and the unchanged type.
def format_ref(ref, type)
  super(ref.sub(/ \(All Parts\)/i, ""), type)
end
# XPath for terms clauses under sections.
TERM_CLAUSE = "//sections//terms".freeze

# XPath, relative to a bibliographic item, for its publisher organizations.
PUBLISHER = "./contributor[role/@type = 'publisher']/organization".freeze

# XPath predicate body matching docidentifier types that do not count
# as standards identifiers (DOI, metanorma, ISSN, ISBN).
OTHERIDS = %w[DOI metanorma ISSN ISBN].
  map { |type| "@type = '#{type}'" }.join(" or ").freeze
# Ranks a bibliographic item by publisher for sorting purposes.
#
# Returns:
#   1 - published by ISO (matched by abbreviation or full name)
#   2 - published by IEC (matched by abbreviation or full name)
#   3 - has a typed docidentifier other than DOI/metanorma/ISSN/ISBN
#   4 - anything else
def pub_class(bib)
  publisher_ranks = {
    1 => ["abbreviation = 'ISO'",
          "name = 'International Organization for Standardization'"],
    2 => ["abbreviation = 'IEC'",
          "name = 'International Electrotechnical Commission'"],
  }
  # Ranks are probed in ascending order, so ISO wins over IEC when an
  # item lists both publishers.
  publisher_ranks.each do |rank, predicates|
    return rank if predicates.any? { |pred| bib.at("#{PUBLISHER}[#{pred}]") }
  end
  bib.at("./docidentifier[@type][not(#{OTHERIDS})]") ? 3 : 4
end
# Sorts a collection of bibliographic items by the string key produced
# by sort_biblio_key.
#
# bib - enumerable of bibliographic items.
#
# Returns a new Array; the input is not modified. The relative order of
# items with identical keys is unspecified.
#
# sort_by computes the key once per item. The key runs several XPath
# queries, so rebuilding it on every comparison would be wasteful.
def sort_biblio(bib)
  bib.sort_by { |item| sort_biblio_key(item) }
end
# TODO: sort by authors
# sort by: doc class (ISO, IEC, other standard (not DOI &c), other)
# then standard class (docid class other than DOI &c)
# then docnumber if present, numeric sort
#      else alphanumeric metanorma id (abbreviation)
# then doc part number if present, numeric sort
# then doc id (not DOI &c)
# then title
# Builds the string key used to order a bibliographic item.
#
# The key is a " :: "-separated concatenation of, in order:
#   * the publisher class from pub_class,
#   * the type of the first docidentifier that is not DOI/metanorma/
#     ISSN/ISBN,
#   * the docnumber zero-padded to 9 digits, or (when there is no
#     docnumber) the metanorma identifier unless it is a bare "[n]",
#   * the part number (the digits after the first "<digit>-" in the
#     docidentifier) zero-padded to 9 digits, or empty when absent,
#   * the docidentifier text,
#   * the main title, else any title, else the formatted reference.
#
# bib - bibliographic item node responding to `at`.
#
# Returns the key as a String.
def sort_biblio_key(bib)
  pubclass = pub_class(bib)
  num = bib.at("./docnumber")&.text
  id = bib.at("./docidentifier[not(#{OTHERIDS})]")
  id_text = id&.text
  metaid = bib.at("./docidentifier[@type = 'metanorma']")&.text
  # A purely numeric "[n]" metanorma id is a citation ordinal, not an
  # abbreviation to sort on.
  abbrid = metaid unless /^\[\d+\]$/.match(metaid)
  partid = id_text[/\d-(\d+)/, 1] if id_text
  type = id["type"] if id
  title = bib.at("./title[@type = 'main']")&.text ||
    bib.at("./title")&.text || bib.at("./formattedref")&.text
  sort_num = num.nil? ? abbrid : format("%09d", num.to_i)
  # Zero-pad so that the string comparison orders parts numerically
  # (part 2 before part 10).
  sort_part = format("%09d", partid.to_i) if partid
  "#{pubclass} :: #{type} :: #{sort_num} :: #{sort_part} :: " \
    "#{id_text} :: #{title}"
end
# Runs the parent sections cleanup and then, only when @amd is set,
# removes the `inline-header` attribute from every element that
# carries one.
def sections_cleanup(x)
  super
  if @amd
    x.xpath("//*[@inline-header]").each do |node|
      node.delete("inline-header")
    end
  end
end
# Returns the path of the boilerplate XML file inside @libdir: the
# French file when @lang is "fr", the default file for anything else.
# The xmldoc argument is not consulted.
def boilerplate_file(xmldoc)
  filename =
    if @lang == "fr"
      "boilerplate-fr.xml"
    else
      "boilerplate.xml"
    end
  File.join(@libdir, filename)
end
# Inserts the footnotes for unpublished references (unpub_footnotes)
# before handing the document to the parent footnote cleanup, whose
# result is returned.
def footnote_cleanup(xmldoc)
  unpub_footnotes(xmldoc)
  super(xmldoc)
end
# For every bibitem note of type 'Unpublished-Status', places a copy of
# the note right after the first eref that cites that bibitem, renamed
# to `fn` and without its `format` and `type` attributes. Bibitems that
# are never cited are skipped; the original note stays in place.
def unpub_footnotes(xmldoc)
  xmldoc.xpath("//bibitem/note[@type = 'Unpublished-Status']").each do |note|
    bibitem_id = note.parent["id"]
    eref = xmldoc.at("//eref[@bibitemid = '#{bibitem_id}']")
    next unless eref

    eref.next = note.dup
    # Work on the node as it now sits in the tree, after insertion.
    eref.next.tap do |footnote|
      footnote.name = "fn"
      %w[format type].each { |attribute| footnote.delete(attribute) }
    end
  end
end
# Runs the parent bibitem cleanup first, then adds the notes for
# unpublished references (unpublished_note), whose result is returned.
def bibitem_cleanup(xmldoc)
  super(xmldoc)
  unpublished_note(xmldoc)
end
def unpublished_note(xmldoc)
xmldoc.xpath("//bibitem[not(note[@type = 'Unpublished-Status'])]").each do |b|
next if pub_class(b) > 2
next unless s = b.at("./status/stage") and s.text.to_i < 60
id = b.at("docidentifier").text
b.at("./language | ./script | ./abstract | ./status").previous = <<~NOTE