require "metanorma-standoc" require_relative "./validate_style" require_relative "./validate_requirements" require_relative "./validate_section" require_relative "./validate_title" require_relative "./validate_image" require_relative "./validate_list" require "nokogiri" require "jing" require "iev" module Metanorma module ISO class Converter < Standoc::Converter def isosubgroup_validate(root) root.xpath("//technical-committee/@type").each do |t| unless %w{TC PC JTC JPC}.include? t.text @log.add("Document Attributes", nil, "invalid technical committee type #{t}") end end root.xpath("//subcommittee/@type").each do |t| unless %w{SC JSC}.include? t.text @log.add("Document Attributes", nil, "invalid subcommittee type #{t}") end end end # ISO/IEC DIR 2, 15.5.3, 20.2 # does not deal with preceding text marked up def see_xrefs_validate(root) @lang == "en" or return root.xpath("//xref").each do |t| preceding = t.at("./preceding-sibling::text()[last()]") next unless !preceding.nil? && /\b(see| refer to)\p{Zs}*\Z/mi.match(preceding) (target = root.at("//*[@id = '#{t['target']}']")) || next target.at("./ancestor-or-self::*[@obligation = 'normative']") && !target.at("./ancestor::sections") and @log.add("Style", t, "'see #{t['target']}' is pointing to a normative section") end end # ISO/IEC DIR 2, 15.5.3 def see_erefs_validate(root) @lang == "en" or return root.xpath("//eref").each do |t| prec = t.at("./preceding-sibling::text()[last()]") next unless !prec.nil? && /\b(see|refer to)\p{Zs}*\Z/mi.match(prec) unless target = root.at("//*[@id = '#{t['bibitemid']}']") @log.add("Bibliography", t, "'#{t} is not pointing to a real reference") next end target.at("./ancestor::references[@normative = 'true']") and @log.add("Style", t, "'see #{t}' is pointing to a normative reference") end end # ISO/IEC DIR 2, 10.4 def locality_erefs_validate(root) root.xpath("//eref[descendant::locality]").each do |t| if /^(ISO|IEC)/.match?(t["citeas"]) && !/: ?(\d+{4}|–)$/.match?(t["citeas"]) @log.add("Style", t, "undated reference #{t['citeas']} should not contain " \ "specific elements") end end end def termdef_warn(text, regex, elem, term, msg) regex.match(text) && @log.add("Style", elem, "#{term}: #{msg}") end # https://www.iso.org/ISO-house-style.html#iso-hs-s-text-r-r-ref_clause3 def term_xrefs_validate(xmldoc) termids = xmldoc .xpath("//sections/terms | //sections/clause[.//terms] | " \ "//annex[.//terms]").each_with_object({}) do |t, m| t.xpath(".//*/@id").each { |a| m[a.text] = true } t.name == "terms" and m[t["id"]] = true end xmldoc.xpath(".//xref").each do |x| term_xrefs_validate1(x, termids) end end def term_xrefs_validate1(xref, termids) closest_id = xref.xpath("./ancestor::*[@id]")&.last or return (termids[xref["target"]] && !termids[closest_id["id"]]) and @log.add("Style", xref, "only terms clauses can cross-reference terms clause " \ "(#{xref['target']})") (!termids[xref["target"]] && termids[closest_id["id"]]) and @log.add("Style", xref, "non-terms clauses cannot cross-reference terms clause " \ "(#{xref['target']})") end # ISO/IEC DIR 2, 16.5.6 def termdef_style(xmldoc) xmldoc.xpath("//term").each do |t| para = t.at("./definition/verbal-definition") || return term = t.at("./preferred//name").text @lang == "en" and termdef_warn(para.text, /\A(the|a)\b/i, t, term, "term definition starts with article") %(Cyrl Latn).include?(@script) and termdef_warn(para.text, /\.\Z/i, t, term, "term definition ends with period") end end def doctype_validate(xmldoc) doctype = xmldoc&.at("//bibdata/ext/doctype")&.text %w(international-standard technical-specification technical-report publicly-available-specification international-workshop-agreement guide amendment technical-corrigendum).include? doctype or @log.add("Document Attributes", nil, "#{doctype} is not a recognised document type") end def script_validate(xmldoc) script = xmldoc&.at("//bibdata/script")&.text %w(Cyrl Latn).include?(script) or @log.add("Document Attributes", nil, "#{script} is not a recognised script") end def iteration_validate(xmldoc) iteration = xmldoc&.at("//bibdata/status/iteration")&.text or return /^\d+/.match(iteration) or @log.add("Document Attributes", nil, "#{iteration} is not a recognised iteration") end def bibdata_validate(doc) doctype_validate(doc) script_validate(doc) iteration_validate(doc) end def content_validate(doc) super title_validate(doc.root) isosubgroup_validate(doc.root) onlychild_clause_validate(doc.root) termdef_style(doc.root) see_xrefs_validate(doc.root) term_xrefs_validate(doc.root) see_erefs_validate(doc.root) locality_erefs_validate(doc.root) bibdata_validate(doc.root) bibitem_validate(doc.root) figure_validate(doc.root) listcount_validate(doc) list_punctuation(doc) end def bibitem_validate(xmldoc) xmldoc.xpath("//bibitem[date/on = '–']").each do |b| b.at("./note[@type = 'Unpublished-Status']") or @log.add("Style", b, "Reference #{b&.at('./@id')&.text} does not have an " \ "associated footnote indicating unpublished status") end end def validate(doc) content_validate(doc) doctype = doc&.at("//bibdata/ext/doctype")&.text schema = case doctype when "amendment", "technical-corrigendum" # @amd "isostandard-amd.rng" else "isostandard-compile.rng" end schema_validate(formattedstr_strip(doc.dup), File.join(File.dirname(__FILE__), schema)) end end end end