Sha256: 020885d9c15fcac890181ac97392291c1b41186f7af1bfeb25a1b603fbb36419

Contents?: true

Size: 1.54 KB

Versions: 12

Compression:

Stored size: 1.54 KB

Contents

module Metanorma
  module Standoc
    module Cleanup
      # Indices sort after letter but before any following
      # letter (x, x_m, x_1, xa); we use colon to force that sort order.
      # Numbers sort *after* letters; we use thorn to force that sort order.
      def symbol_key(sym)
        key = sym.dup
        key.traverse do |n|
          n.name == "math" and
            n.replace(grkletters(MathML2AsciiMath.m2a(n.to_xml)))
        end
        ret = Nokogiri::XML(key.to_xml)
        @c.decode(ret.text.downcase)
          .gsub(/[\[\]{}<>()]/, "").gsub(/\s/m, "")
          .gsub(/[[:punct:]]|[_^]/, ":\\0").gsub(/`/, "")
          .gsub(/[0-9]+/, "รพ\\0")
      end

      def grkletters(text)
        text.gsub(/\b(alpha|beta|gamma|delta|epsilon|zeta|eta|theta|iota|kappa|
                      lambda|mu|nu|xi|omicron|pi|rho|sigma|tau|upsilon|phi|chi|
                      psi|omega)\b/xi, "&\\1;")
      end

      def extract_symbols_list(dlist)
        dl_out = []
        dlist.xpath("./dt | ./dd").each do |dtd|
          if dtd.name == "dt"
            dl_out << { dt: dtd.remove, key: symbol_key(dtd) }
          else
            dl_out.last[:dd] = dtd.remove
          end
        end
        dl_out
      end

      def symbols_cleanup(docxml)
        docxml.xpath("//definitions/dl").each do |dl|
          dl_out = extract_symbols_list(dl)
          dl_out.sort! { |a, b| a[:key] <=> b[:key] || a[:dt] <=> b[:dt] }
          dl.children = dl_out.map { |d| d[:dt].to_s + d[:dd].to_s }.join("\n")
        end
        docxml
      end
    end
  end
end

Version data entries

12 entries across 12 versions & 1 rubygems

Version Path
metanorma-standoc-2.2.6 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.5 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.4 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.3.1 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.3 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.2.2 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.2.1 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.2 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.1.1 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.1 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.0.1 lib/metanorma/standoc/cleanup_symbols.rb
metanorma-standoc-2.2.0 lib/metanorma/standoc/cleanup_symbols.rb