Sha256: cc881604d14899d9f37680abe77f217e360caf77d4b04360f6b029fd396005a6

Contents?: true

Size: 1.75 KB

Versions: 8

Compression:

Stored size: 1.75 KB

Contents

# frozen_string_literal: true

module Asciidoctor
  module PDF
    module Sanitizer
      XMLSpecialChars = {
        '&lt;' => '<',
        '&gt;' => '>',
        '&amp;' => '&',
      }
      XMLSpecialCharsRx = /&(?:[lg]t|amp);/
      InverseXMLSpecialChars = XMLSpecialChars.invert
      InverseXMLSpecialCharsRx = /[#{InverseXMLSpecialChars.keys.join}]/
      (BuiltInNamedEntities = {
        'amp' => '&',
        'apos' => ?',
        'gt' => '>',
        'lt' => '<',
        'nbsp' => ' ',
        'quot' => '"',
      }).default = '?'
      SanitizeXMLRx = /<[^>]+>/
      CharRefRx = /&(?:amp;)?(?:([a-z][a-z]+\d{0,2})|#(?:(\d\d\d{0,4})|x(\h\h\h{0,3})));/
      UnescapedAmpersandRx = /&(?!(?:[a-z][a-z]+\d{0,2}|#(?:\d\d\d{0,4}|x\h\h\h{0,3}));)/

      # Strip leading, trailing and repeating whitespace, remove XML tags and
      # resolve all entities in the specified string.
      #
      # FIXME: move to a module so we can mix it in elsewhere
      # FIXME: add option to control escaping entities, or a filter mechanism in general
      def sanitize string, compact: true
        string = string.gsub SanitizeXMLRx, '' if string.include? '<'
        string = string.gsub(CharRefRx) { $1 ? BuiltInNamedEntities[$1] : ([$2 ? $2.to_i : ($3.to_i 16)].pack 'U1') } if string.include? '&'
        compact ? (string.strip.tr_s ' ', ' ') : string
      end

      def escape_xml string
        string.gsub InverseXMLSpecialCharsRx, InverseXMLSpecialChars
      end

      def unescape_xml string
        string.gsub XMLSpecialCharsRx, XMLSpecialChars
      end

      def escape_amp string
        string.gsub UnescapedAmpersandRx, '&amp;'
      end

      def encode_quotes string
        (string.include? '"') ? (string.gsub '"', '&quot;') : string
      end
    end
  end
end

Version data entries

8 entries across 8 versions & 1 rubygems

Version Path
asciidoctor-pdf-2.3.7 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.6 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.5 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.4 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.3 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.2 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.1 lib/asciidoctor/pdf/sanitizer.rb
asciidoctor-pdf-2.3.0 lib/asciidoctor/pdf/sanitizer.rb