# frozen_string_literal: true # # ronin-db-activerecord - ActiveRecord backend for the Ronin Database. # # Copyright (c) 2022-2023 Hal Brodigan (postmodern.mod3 at gmail.com) # # ronin-db-activerecord is free software: you can redistribute it and/or modify # it under the terms of the GNU Lesser General Public License as published # by the Free Software Foundation, either version 3 of the License, or # (at your option) any later version. # # ronin-db-activerecord is distributed in the hope that it will be useful, # but WITHOUT ANY WARRANTY; without even the implied warranty of # MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE. See the # GNU Lesser General Public License for more details. # # You should have received a copy of the GNU Lesser General Public License # along with ronin-db-activerecord. If not, see . # require 'ronin/db/model' require 'ronin/db/model/importable' require 'ronin/db/model/last_scanned_at' require 'active_record' require 'uri/generic' require 'uri/http' require 'uri/https' require 'uri/ftp' require 'uri/query_params' module Ronin module DB # # Represents parsed URLs. # class URL < ActiveRecord::Base include Model include Model::Importable include Model::LastScannedAt # Mapping of URL Schemes and URI classes SCHEMES = { 'https' => ::URI::HTTPS, 'http' => ::URI::HTTP, 'ftp' => ::URI::FTP } # @!attribute [rw] id # The primary key of the URL. # # @return [Integer] attribute :id, :integer # @!attribute [rw] scheme # The scheme of the URL. # # @return [URLScheme] belongs_to :scheme, required: true, class_name: 'URLScheme' # @!attribute [rw] host_name # The host name of the URL # # @return [HostName] belongs_to :host_name, required: true # @!attribute [rw] port # The port of the URL. # # @return [Port, nil] belongs_to :port, optional: true, class_name: 'Port' # @!attribute [rw] path # The path of the URL. # # @return [String] attribute :path, :string # @!attribute [rw] query # The query string part of the URL. # # @return [String, nil] attribute :query, :string # @!attribute [rw] fragment # The fragment of the URL. # # @return [String, nil] attribute :fragment, :string # @!attribute [r] created_at # Defines the created_at timestamp # # @return [Time] attribute :created_at, :time # @!attribute [rw] query_params # The query params of the URL. # # @return [Array] has_many :query_params, class_name: 'URLQueryParam', dependent: :destroy # @!attribute [rw] web_credentials # Any credentials used with the URL. # # @return [Array] has_many :web_credentials, dependent: :destroy # @!attribute [rw] credentials # The credentials that will work with this URL. # # @return [Array] has_many :credentials, through: :web_credentials # # Searches for all URLs using HTTP. # # @return [Array] # The matching URLs. # # @api public # def self.http joins(:scheme).where(scheme: {name: 'http'}) end # # Searches for all URLs using HTTPS. # # @return [Array] # The matching URLs. # # @api public # def self.https joins(:scheme).where(scheme: {name: 'https'}) end # # Searches for URLs with specific host name(s). # # @param [String, Array] name # The host name(s) to search for. # # @return [Array] # The matching URLs. # # @api public # def self.with_host_name(name) joins(:host_name).where(host_name: {name: name}) end # # Searches for URLs with the specific port number(s). # # @param [Integer, Array] number # The port number(s) to search for. # # @return [Array] # The matching URLs. # # @api public # def self.with_port_number(number) joins(:port).where(port: {number: number}) end # # Searches for all URLs with the exact path. # # @param [String] path # The path to search for. # # @return [Array] # The URL with the matching path. # # @api public # def self.with_path(path) where(path: path) end # # Searches for all URLs with the exact fragment. # # @param [String] fragment # The fragment to search for. # # @return [Array] # The URL with the matching fragment. # # @api public # def self.with_fragment(fragment) where(fragment: fragment) end # # Searches for all URLs sharing a common sub-directory. # # @param [String] root_dir # The sub-directory to search for. # # @return [Array] # The URL with the common sub-directory. # # @api public # def self.with_directory(root_dir) path_column = self.arel_table[:path] where(path: root_dir).or(where(path_column.matches("#{root_dir}/%"))) end # # Searches for all URLs sharing a common base name. # # @param [String] basename # The base name to search for. # # @return [Array] # The URL with the common base name. # # @api public # def self.with_basename(basename) path_column = self.arel_table[:path] where(path_column.matches("%/#{basename}")) end # # Searches for all URLs with a common file-extension. # # @param [String] ext # The file extension to search for. # # @return [Array] # The URLs with the common file-extension. # # @api public # def self.with_file_ext(ext) path_column = self.arel_table[:path] where(path_column.matches("%.#{sanitize_sql_like(ext)}")) end # # Searches for URLs with the given query param name and value. # # @param [String, Array] name # The query param name to search for. # # @param [String, Array] value # The query param value to search for. # # @return [Array] # The URLs with the given query param. # # @api public # def self.with_query_param(name,value) joins(query_params: :name).where( query_params: { ronin_url_query_param_names: {name: name}, value: value } ) end # # Search for all URLs with a given query param name. # # @param [Array, String] name # The query param name to search for. # # @return [Array] # The URLs with the given query param name. # # @api public # def self.with_query_param_name(name) joins(query_params: [:name]).where( query_params: { ronin_url_query_param_names: {name: name} } ) end # # Search for all URLs with a given query param value. # # @param [Array, String] value # The query param value to search for. # # @return [Array] # The URLs with the given query param value. # # @api public # def self.with_query_param_value(value) joins(:query_params).where(query_params: {value: value}) end # # Searches for a URL. # # @param [URI::HTTP, String] url # The URL to search for. # # @return [URL, nil] # The matching URL. # # @api public # def self.lookup(url) uri = URI(url) # create the initial query query = joins(:scheme, :host_name).where( scheme: {name: uri.scheme}, host_name: {name: uri.host}, path: normalized_path(uri), query: uri.query, fragment: uri.fragment ) if uri.port # query the port query = query.joins(:port).where(port: {number: uri.port}) end return query.first end # # Creates a new URL. # # @param [String, URI::HTTP] uri # The URI to create the URL from. # # @return [URL] # The new URL. # # @api public # def self.import(uri) uri = URI(uri) # find or create the URL scheme, host_name and port scheme = URLScheme.find_or_create_by(name: uri.scheme) host_name = HostName.find_or_create_by(name: uri.host) port = if uri.port Port.find_or_create_by( protocol: :tcp, number: uri.port ) end path = normalized_path(uri) query = uri.query fragment = uri.fragment # try to query a pre-existing URI then fallback to creating the URL # with query params. return find_or_create_by( scheme: scheme, host_name: host_name, port: port, path: path, query: query, fragment: fragment ) do |new_url| if uri.respond_to?(:query_params) # find or create the URL query params uri.query_params.each do |name,value| new_url.query_params << URLQueryParam.new( name: URLQueryParamName.find_or_create_by(name: name), value: value ) end end end end # # The host name of the URL. # # @return [String] # The address of host name. # # @api public # def host self.host_name.name end # # The port number used by the URL. # # @return [Integer, nil] # The port number. # # @api public # def port_number self.port.number if self.port end # # Builds a URI object from the URL. # # @return [URI::HTTP, URI::HTTPS] # The URI object created from the URL attributes. # # @api public # def to_uri # map the URL scheme to a URI class url_class = SCHEMES.fetch(self.scheme.name,::URI::Generic) scheme = if self.scheme self.scheme.name end host = if self.host_name self.host_name.name end port = if self.port self.port.number end # build the URI return url_class.build( scheme: scheme, host: host, port: port, path: self.path, query: self.query, fragment: self.fragment ) end # # Converts the URL to a String. # # @return [String] # The string form of the URL. # # @api public # def to_s self.to_uri.to_s end # # Normalizes the path of a URI. # # @param [URI] uri # The URI containing the path. # # @return [String, nil] # The normalized path. # # @api private # def self.normalized_path(uri) case uri when ::URI::HTTP # map empty HTTP paths to '/' unless uri.path.empty? then uri.path else '/' end else uri.path end end end end end require 'ronin/db/host_name' require 'ronin/db/port' require 'ronin/db/url_scheme' require 'ronin/db/url_query_param_name' require 'ronin/db/url_query_param' require 'ronin/db/web_credential'