Sha256: 6faa7994d44498ecfe454bf87efc2ee62773b68652378d1536cf4dd0cc7d80c1

Contents?: true

Size: 1.92 KB

Versions: 1

Compression:

Stored size: 1.92 KB

Contents

require 'spec_helper'
require 'moped'

describe Spidey::Strategies::Moped do
  class TestMopedSpider < Spidey::AbstractSpider
    include Spidey::Strategies::Moped
    handle 'http://www.cnn.com', :process_home

    def result_key(data)
      data[:detail_url]
    end
  end

  before(:each) do
    @db = Moped::Session.new(['127.0.0.1:27017'])
    @db.use 'spidey-mongo-test'
    @spider = TestMopedSpider.new(
      url_collection: @db['urls'],
      result_collection: @db['results'],
      error_collection: @db['errors'])
  end

  after(:each) do
    %w( urls results errors ).each { |col| @db[col].drop }
  end

  it 'should add initial URLs to collection' do
    doc = @db['urls'].find(url: 'http://www.cnn.com').first
    expect(doc['handler']).to eq(:process_home)
    expect(doc['spider']).to eq('TestMopedSpider')
  end

  it 'should not add duplicate URLs' do
    @spider.send :handle, 'http://www.cnn.com', :process_home
    expect(@db['urls'].find(url: 'http://www.cnn.com').count).to eq(1)
  end

  it 'should add results' do
    @spider.record detail_url: 'http://www.cnn.com', foo: 'bar'
    expect(@db['results'].find.count).to eq(1)
    doc = @db['results'].find.first
    expect(doc['detail_url']).to eq('http://www.cnn.com')
    expect(doc['foo']).to eq('bar')
    expect(doc['spider']).to eq('TestMopedSpider')
  end

  it 'should update existing result' do
    @db['results'].insert key: 'http://foo.bar', detail_url: 'http://foo.bar'
    @spider.record detail_url: 'http://foo.bar', foo: 'bar'
    expect(@db['results'].find.count).to eq(1)
  end

  it 'should add error' do
    @spider.add_error error: Exception.new('WTF'), url: 'http://www.cnn.com', handler: :blah
    doc = @db['errors'].find.first
    expect(doc['error']).to eq('Exception')
    expect(doc['url']).to eq('http://www.cnn.com')
    expect(doc['handler']).to eq(:blah)
    expect(doc['message']).to eq('WTF')
    expect(doc['spider']).to eq('TestMopedSpider')
  end
end

Version data entries

1 entries across 1 versions & 1 rubygems

Version Path
spidey-mongo-0.3.0 spec/spidey/strategies/moped_spec.rb