Sha256: a7f4c69fb81737b4cf98a541d44c4a62cd8d4cdf76eef4e295d014ba41802827

Contents?: true

Size: 691 Bytes

Versions: 6

Compression:

Stored size: 691 Bytes

Contents

#!/usr/bin/ruby
require 'rubygems'
require 'muddyit_fu'
require 'rss'
require 'open-uri'

# Connect to Muddy using the local configuration file and work with the
# first collection returned for the account.
muddyit = Muddyit.new('./config.yml')
collection = muddyit.collections.find(:all).first

# Fetch the RSS feed.
# Kernel#open no longer accepts URLs on Ruby 3.0+ (open-uri stopped patching
# it), so read through the URI object instead; this form also works on older
# Rubies with open-uri loaded.
feed_url = 'http://newsrss.bbc.co.uk/rss/newsonline_uk_edition/uk_politics/rss.xml'
rss_content = URI.parse(feed_url).read

# Parse RSS (second argument false: do not validate the feed).
rss = RSS::Parser.parse(rss_content, false)

# Loop through, analyse and display entities
rss.items.each do |item|
  # The item's guid is used as the URI of the page submitted for analysis.
  uri = item.guid.content
  # NOTE(review): :realtime / :store are passed straight through to muddyit_fu;
  # presumably "analyse now, do not persist the page" -- confirm against the
  # gem's documentation.
  page = collection.pages.create({:uri => uri}, {:realtime => true, :store => false})
  puts "#{uri} contains:"
  page.entities.each do |entity|
    puts "\t#{entity.term}, #{entity.classification}"
  end
end

Version data entries

6 entries across 6 versions and 1 rubygem

Version Path
muddyit_fu-0.2.14 examples/newsindexer.rb
muddyit_fu-0.2.13 examples/newsindexer.rb
muddyit_fu-0.2.12 examples/newsindexer.rb
muddyit_fu-0.2.11 examples/newsindexer.rb
muddyit_fu-0.2.10 examples/newsindexer.rb
muddyit_fu-0.2.9 examples/newsindexer.rb