Sha256: efe685a03606e2b22d1b3497aa33199c36001e068a40efbd4e7ac6fb7c2a1328
Contents?: true
Size: 1.31 KB
Versions: 2
Compression:
Stored size: 1.31 KB
Contents
# frozen_string_literal: true require_relative "./feeds/feed" require_relative "./feeds/ayashige" require_relative "./feeds/urlscan" module Miteru class Feeds def initialize(size: 100, directory_traveling: false) @feeds = [ Ayashige.new, UrlScan.new(size) ] @directory_traveling = directory_traveling end def directory_traveling? @directory_traveling end def suspicious_urls @suspicious_urls ||= [].tap do |arr| urls = @feeds.map do |feed| feed.urls.select { |url| url.start_with?("http://", "https://") } end.flatten.uniq urls.map { |url| breakdown(url) }.flatten.uniq.sort.each { |url| arr << url } end end def breakdown(url) begin uri = URI.parse(url) rescue URI::InvalidURIError => _e return [] end base = "#{uri.scheme}://#{uri.hostname}" return [base] unless directory_traveling? segments = uri.path.split("/") return [base] if segments.length.zero? urls = (0...segments.length).map { |idx| "#{base}#{segments[0..idx].join('/')}" } urls.reject do |breakdowned_url| # Reject a url which ends with specific extension names %w(.htm .html .php .asp .aspx).any? { |ext| breakdowned_url.end_with? ext } end end end end
Version data entries
2 entries across 2 versions & 1 rubygems
Version | Path |
---|---|
miteru-0.12.6 | lib/miteru/feeds.rb |
miteru-0.12.5 | lib/miteru/feeds.rb |