Sha256: 9a063c38479cff9a80962f722068a6a74fc7d95997cb4f5dabe032db73a5d4e1

Contents?: true

Size: 1.79 KB

Versions: 5

Compression:

Stored size: 1.79 KB

Contents

module Boilerpipe::SAX
  class TagActionMap
    def self.tag_actions
      labels = ::Boilerpipe::Labels
      {
        STYLE: TagActions::IgnorableElement.new,
        SCRIPT: TagActions::IgnorableElement.new,
        OPTION: TagActions::IgnorableElement.new,
        OBJECT: TagActions::IgnorableElement.new,
        EMBED: TagActions::IgnorableElement.new,
        APPLET: TagActions::IgnorableElement.new,
        LINK: TagActions::IgnorableElement.new,

        A: TagActions::AnchorText.new,
        BODY: TagActions::Body.new,

        STRIKE: TagActions::InlineNoWhitespace.new,
        U: TagActions::InlineNoWhitespace.new,
        B: TagActions::InlineNoWhitespace.new,
        I: TagActions::InlineNoWhitespace.new,
        EM: TagActions::InlineNoWhitespace.new,
        STRONG: TagActions::InlineNoWhitespace.new,
        SPAN: TagActions::InlineNoWhitespace.new,

        # New in 1.1 (especially to improve extraction quality from Wikipedia etc.)
        SUP: TagActions::InlineNoWhitespace.new,

        # New in 1.2
        CODE: TagActions::InlineNoWhitespace.new,
        TT: TagActions::InlineNoWhitespace.new,
        SUB: TagActions::InlineNoWhitespace.new,
        VAR: TagActions::InlineNoWhitespace.new,

        ABBR: TagActions::InlineWhitespace.new,
        ACRONYM: TagActions::InlineWhitespace.new,
        FONT: TagActions::InlineNoWhitespace.new,

        # added in 1.1.1
        NOSCRIPT: TagActions::IgnorableElement.new,

        # New in 1.3

        LI: TagActions::BlockTagLabel.new(labels::LabelAction.new([:LI])),
        H1: TagActions::BlockTagLabel.new(labels::LabelAction.new([:H1, :HEADING])),
        H2: TagActions::BlockTagLabel.new(labels::LabelAction.new([:H2, :HEADING])),
        H3: TagActions::BlockTagLabel.new(labels::LabelAction.new([:H3, :HEADING]))
      }
    end
  end
end

Version data entries

5 entries across 5 versions & 1 rubygems

Version Path
boilerpipe-ruby-0.5.0 lib/boilerpipe/sax/tag_action_map.rb
boilerpipe-ruby-0.4.4 lib/boilerpipe/sax/tag_action_map.rb
boilerpipe-ruby-0.4.3 lib/boilerpipe/sax/tag_action_map.rb
boilerpipe-ruby-0.4.2 lib/boilerpipe/sax/tag_action_map.rb
boilerpipe-ruby-0.4.1 lib/boilerpipe/sax/tag_action_map.rb