# Copyright 2015 Google Inc. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
# http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.
require "gcloud/search/document/list"
require "gcloud/search/connection"
require "gcloud/search/fields"
module Gcloud
module Search
##
# # Document
#
# A document is an object that stores data that can be searched. Each
# document has a {Gcloud::Search::Document#doc_id} that is unique within its
# index, a {Gcloud::Search::Document#rank}, and a list of
# {Gcloud::Search::Document#fields} that contain typed data. Its field
# values can be accessed through hash-like methods such as
# {Gcloud::Search::Document#[]} and {Gcloud::Search::Document#each}.
#
# @example
# require "gcloud"
#
# gcloud = Gcloud.new
# search = gcloud.search
# index = search.index "products"
#
# document = index.document "product-sku-000001"
# document.add "price", 24.95
# index.save document
# document.rank #=> 1443648166
# document["price"] #=> 24.95
#
# @see https://cloud.google.com/search/documents_indexes Documents and
# Indexes
#
class Document
##
# @private Creates a new Document instance.
#
def initialize
@fields = Fields.new
@raw = {}
end
##
# The unique identifier for the document. Can be set explicitly when the
# document is saved. (See {Gcloud::Search::Index#document} and
# {Gcloud::Search::Document#doc_id=}.) If missing, it is automatically
# assigned to the document when saved.
def doc_id
@raw["docId"]
end
##
# Sets the unique identifier for the document.
#
# Must contain only visible, printable ASCII characters (ASCII codes 33
# through 126 inclusive) and be no longer than 500 characters. It cannot
# begin with an exclamation point (!
), and it cannot begin
# and end with double underscores (__
).
def doc_id= new_doc_id
@raw["docId"] = new_doc_id
end
##
# A positive integer which determines the default ordering of documents
# returned from a search. The rank can be set explicitly when the document
# is saved. (See {Gcloud::Search::Index#document} and
# {Gcloud::Search::Document#rank=}.) If missing, it is automatically
# assigned to the document when saved.
def rank
@raw["rank"]
end
##
# Sets the rank of the document.
#
# The same rank should not be assigned to many documents, and should never
# be assigned to more than 10,000 documents. By default (when it is not
# specified or set to 0), it is set at the time the document is created to
# the number of seconds since January 1, 2011. The rank can be used in
# {Gcloud::Search::Index#search} options `expressions`, `order`, and
# `fields`, where it is referenced as `rank`.
def rank= new_rank
@raw["rank"] = new_rank
end
##
# Retrieve the field values associated to a field name.
#
# @param [String] name The name of the field. New values will be
# configured with this name.
#
# @return [FieldValues]
#
# @example
# require "gcloud"
#
# gcloud = Gcloud.new
# search = gcloud.search
# index = search.index "products"
#
# document = index.document "product-sku-000001"
# puts "The document description is:"
# document["description"].each do |value|
# puts "* #{value} (#{value.type}) [#{value.lang}]"
# end
#
def [] name
@fields[name]
end
# Trivial accessor because we want .fields to be listed with methods.
##
# The fields in the document. Each field has a name (String) and a list of
# values ({FieldValues}). (See {Fields})
def fields
@fields
end
##
# Add a new value. If the field name does not exist it will be added. If
# the field value is a DateTime or Numeric, or the type is set to
# `:datetime` or `:number`, then the added value will replace any existing
# values of the same type (since there can be only one).
#
# @param [String] name The name of the field.
# @param [String, Datetime, Float] value The value to add to the field.
# @param [Symbol] type The type of the field value. An attempt is made to
# set the correct type when this option is missing, although it must be
# provided for `:geo` values. A field can have multiple values with same
# or different types; however, it cannot have multiple `:datetime` or
# `:number` values.
#
# The following values are supported:
#
# * `:default` - The value is a string. The format will be automatically
# detected. This is the default value for strings.
# * `:text` - The value is a string with maximum length 1024**2
# characters.
# * `:html` - The value is an HTML-formatted string with maximum length
# 1024**2 characters.
# * `:atom` - The value is a string with maximum length 500 characters.
# * `:geo` - The value is a point on earth described by latitude and
# longitude coordinates, represented in string with any of the listed
# [ways of writing coordinates](http://en.wikipedia.org/wiki/Geographic_coordinate_conversion).
# * `:datetime` - The value is a `DateTime`.
# * `:number` - The value is a `Numeric` between -2,147,483,647 and
# 2,147,483,647. The value will be stored as a double precision
# floating point value in Cloud Search.
# @param [String] lang The language of a string value. Must be a valid
# [ISO 639-1 code](https://en.wikipedia.org/wiki/List_of_ISO_639-1_codes).
#
# @example
# require "gcloud"
#
# gcloud = Gcloud.new
# search = gcloud.search
# index = search.index "products"
#
# document = index.document "product-sku-000001"
# document.add "sku", "product-sku-000001", type: :atom
# document.add "description", "The best T-shirt ever.",
# type: :text, lang: "en"
# document.add "description", "
The best T-shirt ever.
", # type: :html, lang: "en" # document.add "price", 24.95 # def add name, value, type: nil, lang: nil @fields[name].add value, type: type, lang: lang end ## # Deletes a field and all values. (See {Fields#delete}) # # @param [String] name The name of the field. # # @example # require "gcloud" # # gcloud = Gcloud.new # search = gcloud.search # index = search.index "products" # # document = index.document "product-sku-000001" # document.delete "description" # def delete name, &block @fields.delete name, &block end ## # Calls block once for each field, passing the field name and values pair # as parameters. If no block is given an enumerator is returned instead. # (See {Fields#each}) # # @example # require "gcloud" # # gcloud = Gcloud.new # search = gcloud.search # index = search.index "products" # # document = index.document "product-sku-000001" # puts "The document #{document.doc_id} has the following fields:" # document.each do |name, values| # puts "* #{name}:" # values.each do |value| # puts " * #{value} (#{value.type})" # end # end # def each &block @fields.each(&block) end ## # Returns a new array populated with all the field names. # (See {Fields#names}) # # @example # require "gcloud" # # gcloud = Gcloud.new # search = gcloud.search # index = search.index "products" # # document = index.document "product-sku-000001" # puts "The document #{document.doc_id} has the following fields:" # document.names.each do |name| # puts "* #{name}:" # end # def names @fields.names end ## # @private Override to keep working in interactive shells manageable. def inspect insp_rank = "" insp_rank = ", rank: #{rank}" if rank insp_fields = ", fields: (#{fields.names.map(&:inspect).join ', '})" "#{self.class}(doc_id: #{doc_id.inspect}#{insp_rank}#{insp_fields})" end ## # @private New Document from a raw data object. def self.from_hash hash doc = new doc.instance_variable_set "@raw", hash doc.instance_variable_set "@fields", Fields.from_raw(hash["fields"]) doc end ## # @private Returns the Document data as a hash def to_hash hash = @raw.dup hash["fields"] = @fields.to_raw hash end end end end