# Copyright 2015 Google Inc. All rights reserved.
#
# Licensed under the Apache License, Version 2.0 (the "License");
# you may not use this file except in compliance with the License.
# You may obtain a copy of the License at
#
#     http://www.apache.org/licenses/LICENSE-2.0
#
# Unless required by applicable law or agreed to in writing, software
# distributed under the License is distributed on an "AS IS" BASIS,
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
# See the License for the specific language governing permissions and
# limitations under the License.


require "google/cloud/errors"
require "google/cloud/bigquery/service"
require "google/cloud/bigquery/view"
require "google/cloud/bigquery/data"
require "google/cloud/bigquery/table/list"
require "google/cloud/bigquery/schema"
require "google/cloud/bigquery/insert_response"
require "google/apis/bigquery_v2"

module Google
  module Cloud
    module Bigquery
      ##
      # # Table
      #
      # A named resource representing a BigQuery table that holds zero or more
      # records. Every table is defined by a schema that may contain nested and
      # repeated fields.
      #
      # @see https://cloud.google.com/bigquery/preparing-data-for-bigquery
      #   Preparing Data for BigQuery
      #
      # @example
      #   require "google/cloud"
      #
      #   gcloud = Google::Cloud.new
      #   bigquery = gcloud.bigquery
      #   dataset = bigquery.dataset "my_dataset"
      #
      #   table = dataset.create_table "my_table" do |schema|
      #     schema.string "first_name", mode: :required
      #     schema.record "cities_lived", mode: :repeated do |nested_schema|
      #       nested_schema.string "place", mode: :required
      #       nested_schema.integer "number_of_years", mode: :required
      #     end
      #   end
      #
      #   row = {
      #     "first_name" => "Alice",
      #     "cities_lived" => [
      #       {
      #         "place" => "Seattle",
      #         "number_of_years" => 5
      #       },
      #       {
      #         "place" => "Stockholm",
      #         "number_of_years" => 6
      #       }
      #     ]
      #   }
      #   table.insert row
      #
      class Table
        ##
        # @private The Service object.
        attr_accessor :service

        ##
        # @private The Google API Client object.
        attr_accessor :gapi

        ##
        # @private Create an empty Table object.
        def initialize
          @service = nil
          @gapi = Google::Apis::BigqueryV2::Table.new
        end

        ##
        # A unique ID for this table.
        # The ID must contain only letters (a-z, A-Z), numbers (0-9),
        # or underscores (_). The maximum length is 1,024 characters.
        #
        # @!group Attributes
        #
        def table_id
          @gapi.table_reference.table_id
        end

        ##
        # The ID of the `Dataset` containing this table.
        #
        # @!group Attributes
        #
        def dataset_id
          @gapi.table_reference.dataset_id
        end

        ##
        # The ID of the `Project` containing this table.
        #
        # @!group Attributes
        #
        def project_id
          @gapi.table_reference.project_id
        end

        ##
        # @private The gapi fragment containing the Project ID, Dataset ID, and
        # Table ID as a camel-cased hash.
        def table_ref
          table_ref = @gapi.table_reference
          # Only convert when the reference object supports it; otherwise the
          # reference is returned untouched.
          table_ref = table_ref.to_hash if table_ref.respond_to? :to_hash
          table_ref
        end

        ##
        # The combined Project ID, Dataset ID, and Table ID for this table, in
        # the format specified by the [Query
        # Reference](https://cloud.google.com/bigquery/query-reference#from):
        # `project_name:datasetId.tableId`. To use this value in queries see
        # {#query_id}.
        #
        # @!group Attributes
        #
        def id
          @gapi.id
        end

        ##
        # The value returned by {#id}, wrapped in square brackets if the Project
        # ID contains dashes, as specified by the [Query
        # Reference](https://cloud.google.com/bigquery/query-reference#from).
        # Useful in queries.
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   data = bigquery.query "SELECT name FROM #{table.query_id}"
        #
        # @!group Attributes
        #
        def query_id
          project_id["-"] ? "[#{id}]" : id
        end

        ##
        # The name of the table.
        #
        # @!group Attributes
        #
        def name
          @gapi.friendly_name
        end

        ##
        # Updates the name of the table.
        #
        # @!group Attributes
        #
        def name= new_name
          @gapi.update! friendly_name: new_name
          patch_gapi! :friendly_name
        end

        ##
        # A string hash of the table.
        #
        # @!group Attributes
        #
        def etag
          ensure_full_data!
          @gapi.etag
        end

        ##
        # A URL that can be used to access the table using the REST API.
        #
        # @!group Attributes
        #
        def api_url
          ensure_full_data!
          @gapi.self_link
        end

        ##
        # The description of the table.
        #
        # @!group Attributes
        #
        def description
          ensure_full_data!
          @gapi.description
        end

        ##
        # Updates the description of the table.
        #
        # @!group Attributes
        #
        def description= new_description
          @gapi.update! description: new_description
          patch_gapi! :description
        end

        ##
        # The number of bytes in the table. Returns `nil` when the value is
        # missing or cannot be converted to an Integer.
        #
        # @!group Data
        #
        def bytes_count
          ensure_full_data!
          begin
            Integer @gapi.num_bytes
          rescue
            nil
          end
        end

        ##
        # The number of rows in the table. Returns `nil` when the value is
        # missing or cannot be converted to an Integer.
        #
        # @!group Data
        #
        def rows_count
          ensure_full_data!
          begin
            Integer @gapi.num_rows
          rescue
            nil
          end
        end

        ##
        # The time when this table was created. Returns `nil` when the value
        # is missing or cannot be converted.
        #
        # @!group Attributes
        #
        def created_at
          ensure_full_data!
          begin
            # The stored value is divided by 1000.0 before being handed to
            # Time.at, i.e. it is treated as milliseconds since the epoch.
            Time.at(Integer(@gapi.creation_time) / 1000.0)
          rescue
            nil
          end
        end

        ##
        # The time when this table expires.
        # If not present, the table will persist indefinitely.
        # Expired tables will be deleted and their storage reclaimed.
        #
        # @!group Attributes
        #
        def expires_at
          ensure_full_data!
          begin
            Time.at(Integer(@gapi.expiration_time) / 1000.0)
          rescue
            nil
          end
        end

        ##
        # The date when this table was last modified. Returns `nil` when the
        # value is missing or cannot be converted.
        #
        # @!group Attributes
        #
        def modified_at
          ensure_full_data!
          begin
            Time.at(Integer(@gapi.last_modified_time) / 1000.0)
          rescue
            nil
          end
        end

        ##
        # Checks if the table's type is "TABLE".
        #
        # @!group Attributes
        #
        def table?
          @gapi.type == "TABLE"
        end

        ##
        # Checks if the table's type is "VIEW".
        #
        # @!group Attributes
        #
        def view?
          @gapi.type == "VIEW"
        end

        ##
        # The geographic location where the table should reside. Possible
        # values include EU and US. The default value is US.
        #
        # @!group Attributes
        #
        def location
          ensure_full_data!
          @gapi.location
        end

        ##
        # Returns the table's schema. This method can also be used to set,
        # replace, or add to the schema by passing a block. See {Schema} for
        # available methods.
        #
        # @param [Boolean] replace Whether to replace the existing schema with
        #   the new schema. If `true`, the fields will replace the existing
        #   schema. If `false`, the fields will be added to the existing schema.
        #   When a table already contains data, schema changes must be additive.
        #   Thus, the default value is `false`.
        # @yield [schema] a block for setting the schema
        # @yieldparam [Schema] schema the object accepting the schema
        #
        # @return [Google::Cloud::Bigquery::Schema] the schema, frozen
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.create_table "my_table"
        #
        #   table.schema do |schema|
        #     schema.string "first_name", mode: :required
        #     schema.record "cities_lived", mode: :repeated do |nested_schema|
        #       nested_schema.string "place", mode: :required
        #       nested_schema.integer "number_of_years", mode: :required
        #     end
        #   end
        #
        # @!group Attributes
        #
        def schema replace: false
          ensure_full_data!
          schema_builder = Schema.from_gapi @gapi.schema
          if block_given?
            if replace
              # Start from an empty field list so the block's fields replace
              # the existing ones instead of being appended to them.
              empty_schema = Google::Apis::BigqueryV2::TableSchema.new(
                fields: [])
              schema_builder = Schema.from_gapi empty_schema
            end
            yield schema_builder
            schema_builder.check_for_mutated_schema!
            # Only send a patch request when the block changed something.
            if schema_builder.changed?
              @gapi.schema = schema_builder.to_gapi
              patch_gapi! :schema
            end
          end
          schema_builder.freeze
        end

        ##
        # The fields of the table.
        #
        # @!group Attributes
        #
        def fields
          schema.fields
        end

        ##
        # The names of the columns in the table.
        #
        # @!group Attributes
        #
        def headers
          fields.map(&:name)
        end

        ##
        # Retrieves data from the table.
        #
        # @param [String] token Page token, returned by a previous call,
        #   identifying the result set.
        #
        # @param [Integer] max Maximum number of results to return.
        # @param [Integer] start Zero-based index of the starting row to read.
        #
        # @return [Google::Cloud::Bigquery::Data]
        #
        # @example Paginate rows of data: (See {Data#next})
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   data = table.data
        #   data.each do |row|
        #     puts row["first_name"]
        #   end
        #   more_data = data.next if data.next?
        #
        # @example Retrieve all rows of data: (See {Data#all})
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   data = table.data
        #   data.all do |row|
        #     puts row["first_name"]
        #   end
        #
        # @!group Data
        #
        def data token: nil, max: nil, start: nil
          ensure_service!
          options = { token: token, max: max, start: start }
          gapi = service.list_tabledata dataset_id, table_id, options
          Data.from_gapi gapi, self
        end

        ##
        # Copies the data from the table to another table. The destination table
        # argument can also be a string identifier as specified by the [Query
        # Reference](https://cloud.google.com/bigquery/query-reference#from):
        # `project_name:datasetId.tableId`. This is useful for referencing
        # tables in other projects and datasets.
        #
        # @param [Table, String] destination_table The destination for the
        #   copied data.
        # @param [String] create Specifies whether the job is allowed to create
        #   new tables.
        #
        #   The following values are supported:
        #
        #   * `needed` - Create the table if it does not exist.
        #   * `never` - The table must already exist. A 'notFound' error is
        #     raised if the table does not exist.
        # @param [String] write Specifies how to handle data already present in
        #   the destination table. The default value is `empty`.
        #
        #   The following values are supported:
        #
        #   * `truncate` - BigQuery overwrites the table data.
        #   * `append` - BigQuery appends the data to the table.
        #   * `empty` - An error will be returned if the destination table
        #     already contains data.
        # @param [Boolean] dryrun Forwarded unchanged to the service in the
        #   job options. NOTE(review): presumably asks BigQuery to validate
        #   the job without running it; confirm against `Service#copy_table`.
        #
        # @return [Google::Cloud::Bigquery::CopyJob]
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #   destination_table = dataset.table "my_destination_table"
        #
        #   copy_job = table.copy destination_table
        #
        # @example Passing a string identifier for the destination table:
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   copy_job = table.copy "other-project:other_dataset.other_table"
        #
        # @!group Data
        #
        def copy destination_table, create: nil, write: nil, dryrun: nil
          ensure_service!
          options = { create: create, write: write, dryrun: dryrun }
          gapi = service.copy_table table_ref,
                                    get_table_ref(destination_table),
                                    options
          Job.from_gapi gapi, service
        end

        ##
        # Extract the data from the table to a Google Cloud Storage file.
        #
        # @see https://cloud.google.com/bigquery/exporting-data-from-bigquery
        #   Exporting Data From BigQuery
        #
        # @param [Google::Cloud::Storage::File, String, Array]
        #   extract_url The Google Storage file or file URI pattern(s) to which
        #   BigQuery should extract the table data.
        # @param [String] format The exported file format. The default value is
        #   `csv`.
        #
        #   The following values are supported:
        #
        #   * `csv` - CSV
        #   * `json` - [Newline-delimited JSON](http://jsonlines.org/)
        #   * `avro` - [Avro](http://avro.apache.org/)
        # @param [String] compression The compression type to use for exported
        #   files. Possible values include `GZIP` and `NONE`. The default value
        #   is `NONE`.
        # @param [String] delimiter Delimiter to use between fields in the
        #   exported data. Default is `,`.
        # @param [Boolean] header Whether to print out a header row in the
        #   results. Default is `true`.
        # @param [Boolean] dryrun Forwarded unchanged to the service in the
        #   job options. NOTE(review): presumably asks BigQuery to validate
        #   the job without running it; confirm against
        #   `Service#extract_table`.
        #
        # @return [Google::Cloud::Bigquery::ExtractJob]
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   extract_job = table.extract "gs://my-bucket/file-name.json",
        #                               format: "json"
        #
        # @!group Data
        #
        def extract extract_url, format: nil, compression: nil, delimiter: nil,
                    header: nil, dryrun: nil
          ensure_service!
          options = { format: format, compression: compression,
                      delimiter: delimiter, header: header, dryrun: dryrun }
          gapi = service.extract_table table_ref, extract_url, options
          Job.from_gapi gapi, service
        end

        ##
        # Loads data into the table. You can pass a google-cloud storage file
        # path or a google-cloud storage file instance. Or, you can upload a
        # file directly. See [Loading Data with a POST Request](
        # https://cloud.google.com/bigquery/loading-data-post-request#multipart).
        #
        # @param [File, Google::Cloud::Storage::File, String] file A file or the
        #   URI of a Google Cloud Storage file containing data to load into the
        #   table.
        # @param [String] format The format of the data to load. The default
        #   value is `csv`.
        #
        #   The following values are supported:
        #
        #   * `csv` - CSV
        #   * `json` - [Newline-delimited JSON](http://jsonlines.org/)
        #   * `avro` - [Avro](http://avro.apache.org/)
        #   * `datastore_backup` - Cloud Datastore backup
        # @param [String] create Specifies whether the job is allowed to create
        #   new tables.
        #
        #   The following values are supported:
        #
        #   * `needed` - Create the table if it does not exist.
        #   * `never` - The table must already exist. A 'notFound' error is
        #     raised if the table does not exist.
        # @param [String] write Specifies how to handle data already present in
        #   the table. The default value is `empty`.
        #
        #   The following values are supported:
        #
        #   * `truncate` - BigQuery overwrites the table data.
        #   * `append` - BigQuery appends the data to the table.
        #   * `empty` - An error will be returned if the table already contains
        #     data.
        # @param [Array] projection_fields If the `format` option is set
        #   to `datastore_backup`, indicates which entity properties to load
        #   from a Cloud Datastore backup. Property names are case sensitive and
        #   must be top-level properties. If not set, BigQuery loads all
        #   properties. If any named property isn't found in the Cloud Datastore
        #   backup, an invalid error is returned.
        # @param [Boolean] jagged_rows Accept rows that are missing trailing
        #   optional columns. The missing values are treated as nulls. If
        #   `false`, records with missing trailing columns are treated as bad
        #   records, and if there are too many bad records, an invalid error is
        #   returned in the job result. The default value is `false`. Only
        #   applicable to CSV, ignored for other formats.
        # @param [Boolean] quoted_newlines Indicates if BigQuery should allow
        #   quoted data sections that contain newline characters in a CSV file.
        #   The default value is `false`.
        # @param [String] encoding The character encoding of the data. The
        #   supported values are `UTF-8` or `ISO-8859-1`. The default value is
        #   `UTF-8`.
        # @param [String] delimiter Specifies the separator for fields in a CSV
        #   file. BigQuery converts the string to `ISO-8859-1` encoding, and
        #   then uses the first byte of the encoded string to split the data in
        #   its raw, binary state. Default is `,`.
        # @param [Boolean] ignore_unknown Indicates if BigQuery should allow
        #   extra values that are not represented in the table schema. If true,
        #   the extra values are ignored. If false, records with extra columns
        #   are treated as bad records, and if there are too many bad records,
        #   an invalid error is returned in the job result. The default value is
        #   `false`.
        #
        #   The `format` property determines what BigQuery treats as an extra
        #   value:
        #
        #   * `CSV`: Trailing columns
        #   * `JSON`: Named values that don't match any column names
        # @param [Integer] max_bad_records The maximum number of bad records
        #   that BigQuery can ignore when running the job. If the number of bad
        #   records exceeds this value, an invalid error is returned in the job
        #   result. The default value is `0`, which requires that all records
        #   are valid.
        # @param [String] quote The value that is used to quote data sections in
        #   a CSV file. BigQuery converts the string to ISO-8859-1 encoding, and
        #   then uses the first byte of the encoded string to split the data in
        #   its raw, binary state. The default value is a double-quote
        #   `"`. If your data does not contain quoted sections, set
        #   the property value to an empty string. If your data contains quoted
        #   newline characters, you must also set the allowQuotedNewlines
        #   property to true.
        # @param [Integer] skip_leading The number of rows at the top of a CSV
        #   file that BigQuery will skip when loading the data. The default
        #   value is `0`. This property is useful if you have header rows in the
        #   file that should be skipped.
        # @param [Boolean] dryrun Forwarded unchanged to the service in the
        #   job options. NOTE(review): presumably asks BigQuery to validate
        #   the job without running it; confirm against the `Service` load
        #   methods.
        #
        # @return [Google::Cloud::Bigquery::LoadJob]
        #
        # @raise [Google::Cloud::Error] if `file` is neither a storage URL (or
        #   an object that converts to one) nor an existing local file
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   load_job = table.load "gs://my-bucket/file-name.csv"
        #
        # @example Pass a google-cloud storage file instance:
        #   require "google/cloud"
        #   require "google/cloud/storage"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   storage = gcloud.storage
        #   bucket = storage.bucket "my-bucket"
        #   file = bucket.file "file-name.csv"
        #   load_job = table.load file
        #
        # @example Upload a file directly:
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   file = File.open "my_data.csv"
        #   load_job = table.load file
        #
        # @!group Data
        #
        def load file, format: nil, create: nil, write: nil,
                 projection_fields: nil, jagged_rows: nil, quoted_newlines: nil,
                 encoding: nil, delimiter: nil, ignore_unknown: nil,
                 max_bad_records: nil, quote: nil, skip_leading: nil,
                 dryrun: nil
          ensure_service!
          options = { format: format, create: create, write: write,
                      projection_fields: projection_fields,
                      jagged_rows: jagged_rows,
                      quoted_newlines: quoted_newlines, encoding: encoding,
                      delimiter: delimiter, ignore_unknown: ignore_unknown,
                      max_bad_records: max_bad_records, quote: quote,
                      skip_leading: skip_leading, dryrun: dryrun }
          # Storage URLs are checked first, so anything that can be converted
          # to a gs:// URL never reaches the local-file upload path.
          return load_storage(file, options) if storage_url? file
          return load_local(file, options) if local_file? file
          fail Google::Cloud::Error, "Don't know how to load #{file}"
        end

        ##
        # Inserts data into the table for near-immediate querying, without the
        # need to complete a #load operation before the data can appear in query
        # results.
        #
        # @see https://cloud.google.com/bigquery/streaming-data-into-bigquery
        #   Streaming Data Into BigQuery
        #
        # @param [Hash, Array<Hash>] rows A hash object or array of hash objects
        #   containing the data.
        # @param [Boolean] skip_invalid Insert all valid rows of a request, even
        #   if invalid rows exist. The default value is `false`, which causes
        #   the entire request to fail if any invalid rows exist.
        # @param [Boolean] ignore_unknown Accept rows that contain values that
        #   do not match the schema. The unknown values are ignored. Default is
        #   false, which treats unknown values as errors.
        #
        # @return [Google::Cloud::Bigquery::InsertResponse]
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   rows = [
        #     { "first_name" => "Alice", "age" => 21 },
        #     { "first_name" => "Bob", "age" => 22 }
        #   ]
        #   table.insert rows
        #
        # @!group Data
        #
        def insert rows, skip_invalid: nil, ignore_unknown: nil
          # A single row may be given as a bare Hash; wrap it so the service
          # always receives an array.
          rows = [rows] if rows.is_a? Hash
          ensure_service!
          options = { skip_invalid: skip_invalid,
                      ignore_unknown: ignore_unknown }
          gapi = service.insert_tabledata dataset_id, table_id, rows, options
          InsertResponse.from_gapi rows, gapi
        end

        ##
        # Permanently deletes the table.
        #
        # @return [Boolean] Returns `true` if the table was deleted.
        #
        # @example
        #   require "google/cloud"
        #
        #   gcloud = Google::Cloud.new
        #   bigquery = gcloud.bigquery
        #   dataset = bigquery.dataset "my_dataset"
        #   table = dataset.table "my_table"
        #
        #   table.delete
        #
        # @!group Lifecycle
        #
        def delete
          ensure_service!
          service.delete_table dataset_id, table_id
          true
        end

        ##
        # Reloads the table with current data from the BigQuery service.
        #
        # @!group Lifecycle
        #
        def reload!
          ensure_service!
          gapi = service.get_table dataset_id, table_id
          @gapi = gapi
        end
        alias_method :refresh!, :reload!

        ##
        # @private New Table from a Google API Client object.
        def self.from_gapi gapi, conn
          klass = class_for gapi
          klass.new.tap do |f|
            f.gapi = gapi
            f.service = conn
          end
        end

        protected

        ##
        # Raise an error unless an active service is available.
        def ensure_service!
          fail "Must have active connection" unless service
        end

        ##
        # Sends a patch request containing only the named gapi attributes and
        # replaces @gapi with the object returned by the service. Does nothing
        # when no attributes are given.
        def patch_gapi! *attributes
          return if attributes.empty?
          ensure_service!
          patch_args = Hash[attributes.map do |attr|
            [attr, @gapi.send(attr)]
          end]
          patch_gapi = Google::Apis::BigqueryV2::Table.new patch_args
          @gapi = service.patch_table dataset_id, table_id, patch_gapi
        end

        ##
        # Picks the class to instantiate for a gapi object: View when the
        # gapi type is "VIEW", otherwise the receiver itself.
        def self.class_for gapi
          return View if gapi.type == "VIEW"
          self
        end

        ##
        # Starts a load job from a Google Cloud Storage location and wraps
        # the result in a Job.
        def load_storage url, options = {}
          # Convert to storage URL
          url = url.to_gs_url if url.respond_to? :to_gs_url

          gapi = service.load_table_gs_url dataset_id, table_id, url, options
          Job.from_gapi gapi, service
        end

        ##
        # Starts a load job by uploading a local file and wraps the result in
        # a Job.
        #
        # No storage-URL conversion happens here: #load routes every object
        # that responds to `to_gs_url` to #load_storage before this method is
        # considered, and a gs:// URL is not a valid argument for the upload
        # call.
        def load_local file, options = {}
          gapi = service.load_table_file dataset_id, table_id, file, options
          Job.from_gapi gapi, service
        end

        ##
        # True when the argument can be converted to a storage URL, or is
        # string-like and starts with "gs://" (case-insensitive).
        def storage_url? file
          file.respond_to?(:to_gs_url) ||
            (file.respond_to?(:to_str) &&
            file.to_str.downcase.start_with?("gs://"))
        end

        ##
        # True when the argument names an existing regular file. Any
        # StandardError raised by the check (for example, an argument that
        # cannot be treated as a path) is reported as false.
        def local_file? file
          ::File.file? file
        rescue StandardError
          false
        end

        ##
        # Load the complete representation of the table if it has been
        # only partially loaded by a request to the API list method.
        def ensure_full_data!
          reload_gapi! unless data_complete?
        end

        ##
        # Fetches the table from the service and replaces @gapi with it.
        def reload_gapi!
          ensure_service!
          gapi = service.get_table dataset_id, table_id
          @gapi = gapi
        end

        ##
        # True when @gapi is a full Google::Apis::BigqueryV2::Table object.
        def data_complete?
          @gapi.is_a? Google::Apis::BigqueryV2::Table
        end

        private

        ##
        # Resolves a destination to a table reference: objects that respond
        # to `table_ref` supply their own; anything else is handed to
        # Service.table_ref_from_s together with this table's reference.
        def get_table_ref table
          if table.respond_to? :table_ref
            table.table_ref
          else
            Service.table_ref_from_s table, table_ref
          end
        end

        ##
        # Yielded to a block to accumulate changes for a patch request.
        class Updater < Table
          ##
          # A list of attributes that were updated.
          attr_reader :updates

          ##
          # Create an Updater object.
          def initialize gapi
            @updates = []
            @gapi = gapi
            @schema = nil
          end

          ##
          # Returns the table's schema. This method can also be used to set,
          # replace, or add to the schema by passing a block. See {Schema} for
          # available methods.
          #
          # @param [Boolean] replace Whether to replace the existing schema with
          #   the new schema. If `true`, the fields will replace the existing
          #   schema. If `false`, the fields will be added to the existing
          #   schema. When a table already contains data, schema changes must be
          #   additive. Thus, the default value is `false`.
          # @yield [schema] a block for setting the schema
          # @yieldparam [Schema] schema the object accepting the schema
          #
          # @return [Google::Cloud::Bigquery::Schema]
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |t|
          #     t.name = "My Table"
          #     t.description = "A description of my table."
          #     t.schema do |s|
          #       s.string "first_name", mode: :required
          #       s.record "cities_lived", mode: :repeated do |r|
          #         r.string "place", mode: :required
          #         r.integer "number_of_years", mode: :required
          #       end
          #     end
          #   end
          #
          # @!group Schema
          #
          def schema replace: false
            # Same as Table#schema, but not frozen
            # TODO: make sure to call ensure_full_data! on Dataset#update
            @schema ||= Schema.from_gapi @gapi.schema
            if block_given?
              if replace
                @schema = Schema.from_gapi \
                  Google::Apis::BigqueryV2::TableSchema.new(fields: [])
              end
              yield @schema
              check_for_mutated_schema!
            end
            # Do not freeze on updater, allow modifications
            @schema
          end

          ##
          # Adds a string field to the schema.
          #
          # See {Schema#string}.
          #
          # @param [String] name The field name. The name must contain only
          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
          #   start with a letter or underscore. The maximum length is 128
          #   characters.
          # @param [String] description A description of the field.
          # @param [Symbol] mode The field's mode. The possible values are
          #   `:nullable`, `:required`, and `:repeated`. The default value is
          #   `:nullable`.
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |schema|
          #     schema.string "first_name", mode: :required
          #   end
          #
          # @!group Schema
          def string name, description: nil, mode: :nullable
            schema.string name, description: description, mode: mode
          end

          ##
          # Adds an integer field to the schema.
          #
          # See {Schema#integer}.
          #
          # @param [String] name The field name. The name must contain only
          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
          #   start with a letter or underscore. The maximum length is 128
          #   characters.
          # @param [String] description A description of the field.
          # @param [Symbol] mode The field's mode. The possible values are
          #   `:nullable`, `:required`, and `:repeated`. The default value is
          #   `:nullable`.
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |schema|
          #     schema.integer "age", mode: :required
          #   end
          #
          # @!group Schema
          def integer name, description: nil, mode: :nullable
            schema.integer name, description: description, mode: mode
          end

          ##
          # Adds a floating-point number field to the schema.
          #
          # See {Schema#float}.
          #
          # @param [String] name The field name. The name must contain only
          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
          #   start with a letter or underscore. The maximum length is 128
          #   characters.
          # @param [String] description A description of the field.
          # @param [Symbol] mode The field's mode. The possible values are
          #   `:nullable`, `:required`, and `:repeated`. The default value is
          #   `:nullable`.
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |schema|
          #     schema.float "price", mode: :required
          #   end
          #
          # @!group Schema
          def float name, description: nil, mode: :nullable
            schema.float name, description: description, mode: mode
          end

          ##
          # Adds a boolean field to the schema.
          #
          # See {Schema#boolean}.
          #
          # @param [String] name The field name. The name must contain only
          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
          #   start with a letter or underscore. The maximum length is 128
          #   characters.
          # @param [String] description A description of the field.
          # @param [Symbol] mode The field's mode. The possible values are
          #   `:nullable`, `:required`, and `:repeated`. The default value is
          #   `:nullable`.
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |schema|
          #     schema.boolean "active", mode: :required
          #   end
          #
          # @!group Schema
          def boolean name, description: nil, mode: :nullable
            schema.boolean name, description: description, mode: mode
          end

          ##
          # Adds a timestamp field to the schema.
          #
          # See {Schema#timestamp}.
          #
          # @param [String] name The field name. The name must contain only
          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
          #   start with a letter or underscore. The maximum length is 128
          #   characters.
          # @param [String] description A description of the field.
          # @param [Symbol] mode The field's mode. The possible values are
          #   `:nullable`, `:required`, and `:repeated`. The default value is
          #   `:nullable`.
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |schema|
          #     schema.timestamp "creation_date", mode: :required
          #   end
          #
          # @!group Schema
          def timestamp name, description: nil, mode: :nullable
            schema.timestamp name, description: description, mode: mode
          end

          ##
          # Adds a record field to the schema. A block must be passed describing
          # the nested fields of the record. For more information about nested
          # and repeated records, see [Preparing Data for BigQuery
          # ](https://cloud.google.com/bigquery/preparing-data-for-bigquery).
          #
          # See {Schema#record}.
          #
          # @param [String] name The field name. The name must contain only
          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
          #   start with a letter or underscore. The maximum length is 128
          #   characters.
          # @param [String] description A description of the field.
          # @param [Symbol] mode The field's mode. The possible values are
          #   `:nullable`, `:required`, and `:repeated`. This method passes
          #   `nil` through when no mode is given; the resulting default is
          #   decided by {Schema#record}.
          # @yield [nested_schema] a block for setting the nested schema
          # @yieldparam [Schema] nested_schema the object accepting the
          #   nested schema
          #
          # @example
          #   require "google/cloud"
          #
          #   gcloud = Google::Cloud.new
          #   bigquery = gcloud.bigquery
          #   dataset = bigquery.dataset "my_dataset"
          #   table = dataset.create_table "my_table" do |schema|
          #     schema.record "cities_lived", mode: :repeated do |cities_lived|
          #       cities_lived.string "place", mode: :required
          #       cities_lived.integer "number_of_years", mode: :required
          #     end
          #   end
          #
          # @!group Schema
          #
          def record name, description: nil, mode: nil, &block
            schema.record name, description: description, mode: mode, &block
          end

          ##
          # Make sure any schema changes are recorded: when the cached schema
          # has changed, copy it onto the gapi object and queue :schema as an
          # updated attribute.
          def check_for_mutated_schema!
            return if @schema.nil?
            @schema.check_for_mutated_schema!
            return unless @schema.changed?
            @gapi.schema = @schema.to_gapi
            patch_gapi! :schema
          end

          ##
          # Returns the gapi object after folding in any pending schema
          # changes.
          def to_gapi
            check_for_mutated_schema!
            @gapi
          end

          protected

          ##
          # Change to a NOOP
          def ensure_full_data!
            # Do nothing because we trust the gapi is full before we get here.
          end

          ##
          # Queue up all the updates instead of making them. Accepts any
          # number of attribute names, matching Table#patch_gapi!; duplicates
          # are dropped.
          def patch_gapi! *attributes
            @updates.concat attributes
            @updates.uniq!
          end
        end
      end
    end
  end
end