Sha256: f827654adce4f42f818b300fd905dd15628e69cc84582033b8aadb9aac88878f
Contents?: true
Size: 469 Bytes
Versions: 33
Compression:
Stored size: 469 Bytes
Contents
require 'rubygems' require 'mechanize' agent = Mechanize.new agent.max_history = nil # unlimited history stack = agent.get(ARGV[0]).links while l = stack.pop next unless l.uri host = l.uri.host next unless host.nil? or host == agent.history.first.uri.host next if agent.visited? l.href puts "crawling #{l.uri}" begin page = l.click next unless Mechanize::Page === page stack.push(*page.links) rescue Mechanize::ResponseCodeError end end
Version data entries
33 entries across 33 versions & 2 rubygems