Sha256: 6a75e240b3e9e93f38c86a0987f2a3f63e92d9f9434c50e1bd26d90eea97a40c
Contents?: true
Size: 993 Bytes
Versions: 3
Compression:
Stored size: 993 Bytes
Contents
class DevTo::Scraper def get_page Nokogiri::HTML(open("https://dev.to/")) end def get_posts self.get_page.css(".articles-list .substories .single-article") end def make_posts self.get_posts.each do |data| post = DevTo::Post.new post.title = data.search(".content h3 span").remove post.title = data.search(".content h3").text.strip.gsub(/[[:space:]]+/," ") post.author = data.search("h4").text.strip post.tags = data.search(".tags .tag").collect { |tag| tag.text.strip} post.url = "https://dev.to" + data.search("a").last.attr("href") post.comments = data.search(".engagement-count-number").first.text.strip post.likes = data.search(".engagement-count-number").last.text.strip end end def make_content(post) post_page = Nokogiri::HTML(open("#{post.url}")) post.content = post_page.search("body #article-body").text.strip post.date = post_page.search("#main-title .published-at").text.strip end end
Version data entries
3 entries across 3 versions & 1 rubygems
Version | Path |
---|---|
dev_to-0.1.3 | lib/dev_to/scraper.rb |
dev_to-0.1.2 | lib/dev_to/scraper.rb |
dev_to-0.1.0 | lib/dev_to/scraper.rb |