require 'rsolr' module ActiveFedora class SolrService attr_reader :conn def initialize(host, args) host = 'http://localhost:8080/solr' unless host args = {:read_timeout => 120, :open_timeout => 120}.merge(args.dup) args.merge!(:url=>host) @conn = RSolr.connect args end class << self def register(host=nil, args={}) Thread.current[:solr_service] = new(host, args) end def reset! Thread.current[:solr_service] = nil end def instance # Register Solr unless Thread.current[:solr_service] register(ActiveFedora.solr_config[:url]) end raise SolrNotInitialized unless Thread.current[:solr_service] Thread.current[:solr_service] end def lazy_reify_solr_results(solr_results, opts = {}) Enumerator.new do |yielder| solr_results.each do |hit| yielder.yield(reify_solr_result(hit, opts)) end end end def reify_solr_results(solr_results, opts = {}) solr_results.collect {|hit| reify_solr_result(hit, opts)} end def reify_solr_result(hit, opts = {}) klass = class_from_solr_document(hit) if opts[:load_from_solr] klass.load_instance_from_solr(hit[SOLR_DOCUMENT_ID], hit) else klass.find(hit[SOLR_DOCUMENT_ID], cast: true) end end #Returns the best singular class for the solr object def class_from_solr_document(hit, opts = {}) #Set the default starting point to the class specified, if available. best_model_match = Model.from_class_uri(opts[:class]) unless opts[:class].nil? hit[HAS_MODEL_SOLR_FIELD].each do |value| model_value = Model.from_class_uri(value) if model_value # Set as the first model in case opts[:class] was nil best_model_match ||= model_value # If there is an inheritance structure, use the most specific case. if best_model_match > model_value best_model_match = model_value end end end ActiveFedora::Base.logger.warn "Could not find a model for #{hit["id"]}, defaulting to ActiveFedora::Base" unless best_model_match if ActiveFedora::Base.logger best_model_match || ActiveFedora::Base end # Construct a solr query for a list of pids # This is used to get a solr response based on the list of pids in an object's RELS-EXT relationhsips # If the pid_array is empty, defaults to a query of "id:NEVER_USE_THIS_ID", which will return an empty solr response # @param [Array] pid_array the pids that you want included in the query def construct_query_for_pids(pid_array) q = pid_array.reject { |x| x.empty? }.map { |pid| raw_query(SOLR_DOCUMENT_ID, pid) } q.empty? ? "id:NEVER_USE_THIS_ID" : q.join(" OR ".freeze) end # Create a raw query clause suitable for sending to solr as an fq element # @param [String] key # @param [String] value def raw_query(key, value) "_query_:\"{!raw f=#{key}}#{value.gsub('"', '\"')}\"" end def solr_name(*args) Solrizer.default_field_mapper.solr_name(*args) end # Create a query with a clause for each key, value # @param [Hash, Array>] args key is the predicate, value is the target_uri # @param [String] join_with ('AND') the value we're joining the clauses with # @example # construct_query_for_rel [[:has_model, "info:fedora/afmodel:ComplexCollection"], [:has_model, "info:fedora/afmodel:ActiveFedora_Base"]], 'OR' # # => _query_:"{!raw f=has_model_ssim}info:fedora/afmodel:ComplexCollection" OR _query_:"{!raw f=has_model_ssim}info:fedora/afmodel:ActiveFedora_Base" def construct_query_for_rel(field_pairs, join_with = 'AND') field_pairs = field_pairs.to_a if field_pairs.kind_of? Hash clauses = field_pairs.map { |(predicate, target_uri)| raw_query(solr_name(predicate, :symbol), target_uri) } clauses.join(" #{join_with} ".freeze) end def query(query, args={}) raw = args.delete(:raw) args = args.merge(:q=>query, :qt=>'standard') result = SolrService.instance.conn.get('select', :params=>args) return result if raw result['response']['docs'] end # Get the count of records that match the query # @param [String] query a solr query # @param [Hash] args arguments to pass through to `args' param of SolrService.query (note that :rows will be overwritten to 0) # @return [Integer] number of records matching def count(query, args={}) args = args.merge(:raw=>true, :rows=>0) SolrService.query(query, args)['response']['numFound'].to_i end # @param [Hash] doc the document to index # @param [Hash] params # :commit => commits immediately # :softCommit => commit to memory, but don't flush to disk def add(doc, params = {}) SolrService.instance.conn.add(doc, params: params) end def commit SolrService.instance.conn.commit end end HAS_MODEL_SOLR_FIELD = solr_name("has_model", :symbol).freeze end #SolrService class SolrNotInitialized < StandardError;end end #ActiveFedora