Sha256: e9da9893845909188166510acbf0952bc644889788390032c8679c287a9f2f2b

Contents?: true

Size: 1.77 KB

Versions: 15

Compression:

Stored size: 1.77 KB

Contents

module CMSScanner
  # Scope system logic
  class Target < WebSite
    # @return [ Array<PublicSuffix::Domain, String> ]
    def scope
      @scope ||= Scope.new
    end

    # @param [ String ] url An absolute URL
    #
    # @return [ Boolean ] true if the url given is in scope
    def in_scope?(url)
      scope.include?(Addressable::URI.parse(url.strip).host)
    rescue StandardError
      false
    end

    # @param [ Typhoeus::Response ] res
    # @param [ String ] xpath
    #
    # @yield [ String, Nokogiri::XML::Element ] The in scope url and its associated tag
    #
    # @return [ Array<String> ] The in scope absolute URLs detected in the response's body
    def in_scope_urls(res, xpath = '//@href|//@src|//@data-src')
      found = []

      urls_from_page(res, xpath) do |url, tag|
        next unless in_scope?(url)

        yield url, tag if block_given?

        found << url
      end

      found
    end

    # Scope Implementation
    class Scope
      # @return [ Array<PublicSuffix::Domain ] The valid domains in scope
      def domains
        @domains ||= []
      end

      # @return [ Array<String> ] The invalid domains in scope (such as IP addresses etc)
      def invalid_domains
        @invalid_domains ||= []
      end

      def <<(element)
        if PublicSuffix.valid?(element)
          domains << PublicSuffix.parse(element)
        else
          invalid_domains << element
        end
      end

      # @return [ Boolean ] Wether or not the host is in the scope
      def include?(host)
        if PublicSuffix.valid?(host)
          domain = PublicSuffix.parse(host)

          domains.each { |d| return true if domain.match(d) }
        else
          invalid_domains.each { |d| return true if host == d }
        end

        false
      end
    end
  end
end

Version data entries

15 entries across 15 versions & 1 rubygems

Version Path
cms_scanner-0.0.41.10 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.9 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.8 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.7 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.6 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.5 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.4 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.3 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.2 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.1 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.41.0 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.40.3 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.40.2 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.40.1 lib/cms_scanner/target/scope.rb
cms_scanner-0.0.40 lib/cms_scanner/target/scope.rb