Sha256: c38f8b56dec75148f426415183a21fba1a4a66060669fa8b95584be621305023

Contents?: true

Size: 1.95 KB

Versions: 8

Compression:

Stored size: 1.95 KB

Contents

module Nokogiri
  module XML
    class FragmentHandler < Nokogiri::XML::SAX::Document # :nodoc:
      def initialize node, original_html
        @doc_started    = false
        @document       = node.document
        @stack          = [node]
        @klass          = if node.kind_of?(Nokogiri::HTML::DocumentFragment)
                            Nokogiri::HTML::DocumentFragment
                          else
                            Nokogiri::XML::DocumentFragment
                          end
        #
        # the regexes used in start_element() and characters() anchor at
        # start-of-line, but we really only want them to anchor at
        # start-of-doc. so let's only save up to the first newline.
        #
        # this implementation choice was the result of some benchmarks, if
        # you're curious: http://gist.github.com/115936
        #
        newline_index = original_html.index("\n")
        @original_html = if newline_index
                           original_html[0,newline_index]
                         else
                           original_html
                         end
      end

      def start_element name, attrs = []
        regex = (@klass == Nokogiri::HTML::DocumentFragment) ? %r{^\s*<#{Regexp.escape(name)}}i \
                                                             : %r{^\s*<#{Regexp.escape(name)}}
        @doc_started = true if @original_html =~ regex
        return unless @doc_started

        node = Node.new(name, @document)
        attrs << "" unless (attrs.length % 2) == 0
        Hash[*attrs].each do |k,v|
          node[k] = v
        end
        @stack.last << node
        @stack << node
      end

      def characters string
        @doc_started = true if @original_html.strip =~ %r{^\s*#{Regexp.escape(string.strip)}}
        @stack.last << Nokogiri::XML::Text.new(string, @document)
      end

      def end_element name
        return unless @stack.last.name == name
        @stack.pop
      end
    end
  end
end

Version data entries

8 entries across 8 versions & 1 rubygems

Version Path
nokogiri-1.3.0-x86-mingw32 lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.0-java lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.0-x86-mswin32 lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.1-java lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.0 lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.1-x86-mingw32 lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.1-x86-mswin32 lib/nokogiri/xml/fragment_handler.rb
nokogiri-1.3.1 lib/nokogiri/xml/fragment_handler.rb