RubyGems - google-cloud-bigquery - Versions diffs - 1.1.0 → 1.2.0 - Mend

google-cloud-bigquery 1.1.0 → 1.2.0

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (16) hide show

checksums.yaml +4 -4
data/README.md +27 -19
data/lib/google/cloud/bigquery/convert.rb +106 -13
data/lib/google/cloud/bigquery/copy_job.rb +168 -0
data/lib/google/cloud/bigquery/dataset.rb +313 -112
data/lib/google/cloud/bigquery/encryption_configuration.rb +124 -0
data/lib/google/cloud/bigquery/extract_job.rb +149 -0
data/lib/google/cloud/bigquery/job.rb +14 -3
data/lib/google/cloud/bigquery/load_job.rb +770 -0
data/lib/google/cloud/bigquery/project.rb +118 -20
data/lib/google/cloud/bigquery/query_job.rb +403 -2
data/lib/google/cloud/bigquery/schema/field.rb +22 -22
data/lib/google/cloud/bigquery/service.rb +45 -328
data/lib/google/cloud/bigquery/table.rb +375 -95
data/lib/google/cloud/bigquery/version.rb +1 -1
metadata +3 -2

data/lib/google/cloud/bigquery/encryption_configuration.rb ADDED

@@ -0,0 +1,124 @@
+# Copyright 2018 Google LLC
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+#     https://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+require "google/apis/bigquery_v2"
+module Google
+  module Cloud
+    module Bigquery
+      ##
+      # # Encryption Configuration
+      #
+      # A builder for BigQuery table encryption configurations, passed to block
+      # arguments to {Dataset#create_table} and
+      # {Table#encryption_configuration}.
+      #
+      # @see https://cloud.google.com/bigquery/docs/customer-managed-encryption
+      #   Protecting Data with Cloud KMS Keys
+      #
+      # @example
+      #   require "google/cloud/bigquery"
+      #
+      #   bigquery = Google::Cloud::Bigquery.new
+      #   dataset = bigquery.dataset "my_dataset"
+      #   key_name = "projects/a/locations/b/keyRings/c/cryptoKeys/d"
+      #   encrypt_config = bigquery.encryption kms_key: key_name
+      #   table = dataset.create_table "my_table" do |updater|
+      #     updater.encryption = encrypt_config
+      #   end
+      #
+      class EncryptionConfiguration
+        ##
+        # @private The Google API Client object.
+        attr_accessor :gapi
+        ##
+        # @private Create an empty EncryptionConfiguration object.
+        def initialize
+          @gapi = Google::Apis::BigqueryV2::EncryptionConfiguration.new
+        end
+        ##
+        # The Cloud KMS encryption key that will be used to protect the table.
+        # For example: `projects/a/locations/b/keyRings/c/cryptoKeys/d`
+        # The default value is `nil`, which means default encryption is used.
+        #
+        # @return [String]
+        #
+        # @example
+        #   require "google/cloud/bigquery"
+        #
+        #   config = Google::Cloud::Bigquery::EncryptionConfiguration.new
+        #   key_name = "projects/a/locations/b/keyRings/c/cryptoKeys/d"
+        #   config.kms_key = key_name
+        #
+        def kms_key
+          @gapi.kms_key_name
+        end
+        ##
+        # Set the Cloud KMS encryption key that will be used to protect the
+        # table. For example: `projects/a/locations/b/keyRings/c/cryptoKeys/d`
+        # The default value is `nil`, which means default encryption is used.
+        #
+        # @param [String] new_kms_key_name New Cloud KMS key name
+        #
+        # @example
+        #   require "google/cloud/bigquery"
+        #
+        #   config = Google::Cloud::Bigquery::EncryptionConfiguration.new
+        #   key_name = "projects/a/locations/b/keyRings/c/cryptoKeys/d"
+        #   config.kms_key = key_name
+        #
+        def kms_key= new_kms_key_name
+          frozen_check!
+          @gapi.kms_key_name = new_kms_key_name
+        end
+        # @private
+        def changed?
+          return false if frozen?
+          @original_json != @gapi.to_json
+        end
+        ##
+        # @private Google API Client object.
+        def to_gapi
+          @gapi
+        end
+        ##
+        # @private Google API Client object.
+        def self.from_gapi gapi
+          new_config = new
+          new_config.instance_variable_set :@gapi, gapi
+          new_config
+        end
+        # @private
+        def == other
+          return false unless other.is_a? EncryptionConfiguration
+          to_gapi.to_json == other.to_gapi.to_json
+        end
+        protected
+        def frozen_check!
+          return unless frozen?
+          raise ArgumentError, "Cannot modify a frozen encryption configuration"
+        end
+      end
+    end
+  end
+end

data/lib/google/cloud/bigquery/extract_job.rb CHANGED

@@ -155,6 +155,155 @@ module Google
         def destinations_counts
           # Pair each destination with its file count, then build the hash.
           pairs = destinations.zip destinations_file_counts
           Hash[pairs]
         end
+        ##
+        # Yielded to a block to accumulate changes for an API request.
+        class Updater < ExtractJob
+          ##
+          # @private Create an Updater object.
+          def initialize gapi
+            @gapi = gapi
+          end
+          ##
+          # @private Create an Updater from an options hash.
+          #
+          # @return [Google::Cloud::Bigquery::ExtractJob::Updater] A job
+          #   configuration object for setting query options.
+          def self.from_options service, table, storage_files, options = {}
+            job_ref = service.job_ref_from options[:job_id], options[:prefix]
+            storage_urls = Array(storage_files).map do |url|
+              url.respond_to?(:to_gs_url) ? url.to_gs_url : url
+            end
+            dest_format = options[:format]
+            if dest_format.nil?
+              dest_format = Convert.derive_source_format storage_urls.first
+            end
+            req = Google::Apis::BigqueryV2::Job.new(
+              job_reference: job_ref,
+              configuration: Google::Apis::BigqueryV2::JobConfiguration.new(
+                extract: Google::Apis::BigqueryV2::JobConfigurationExtract.new(
+                  destination_uris: Array(storage_urls),
+                  source_table: table
+                ),
+                dry_run: options[:dryrun]
+              )
+            )
+            updater = ExtractJob::Updater.new req
+            updater.compression = options[:compression]
+            updater.delimiter = options[:delimiter]
+            updater.format = dest_format
+            updater.header = options[:header]
+            updater.labels = options[:labels] if options[:labels]
+            updater
+          end
+          ##
+          # Sets the geographic location where the job should run. Required
+          # except for US and EU.
+          #
+          # @param [String] value A geographic location, such as "US", "EU" or
+          #   "asia-northeast1". Required except for US and EU.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   table = dataset.table "my_table"
+          #
+          #   destination = "gs://my-bucket/file-name.csv"
+          #   extract_job = table.extract_job destination do |j|
+          #     j.location = "EU"
+          #   end
+          #
+          #   extract_job.wait_until_done!
+          #   extract_job.done? #=> true
+          #
+          # @!group Attributes
+          def location= value
+            @gapi.job_reference.location = value
+          end
+          ##
+          # Sets the compression type.
+          #
+          # @param [String] value The compression type to use for exported
+          #   files. Possible values include `GZIP` and `NONE`. The default
+          #   value is `NONE`.
+          #
+          # @!group Attributes
+          def compression= value
+            @gapi.configuration.extract.compression = value
+          end
+          ##
+          # Sets the field delimiter.
+          #
+          # @param [String] value Delimiter to use between fields in the
+          #   exported data. Default is <code>,</code>.
+          #
+          # @!group Attributes
+          def delimiter= value
+            @gapi.configuration.extract.field_delimiter = value
+          end
+          ##
+          # Sets the destination file format. The default value is `csv`.
+          #
+          # The following values are supported:
+          #
+          # * `csv` - CSV
+          # * `json` - [Newline-delimited JSON](http://jsonlines.org/)
+          # * `avro` - [Avro](http://avro.apache.org/)
+          #
+          # @param [String] new_format The new source format.
+          #
+          # @!group Attributes
+          #
+          def format= new_format
+            @gapi.configuration.extract.update! destination_format:
+              Convert.source_format(new_format)
+          end
+          ##
+          # Print a header row in the exported file.
+          #
+          # @param [Boolean] value Whether to print out a header row in the
+          #   results. Default is `true`.
+          #
+          # @!group Attributes
+          def header= value
+            @gapi.configuration.extract.print_header = value
+          end
+          ##
+          # Sets the labels to use for the job.
+          #
+          # @param [Hash] value A hash of user-provided labels associated with
+          #   the job. You can use these to organize and group your jobs. Label
+          #   keys and values can be no longer than 63 characters, can only
+          #   contain lowercase letters, numeric characters, underscores and
+          #   dashes. International characters are allowed. Label values are
+          #   optional. Label keys must start with a letter and each label in
+          #   the list must have a different key.
+          #
+          # @!group Attributes
+          #
+          def labels= value
+            @gapi.configuration.update! labels: value
+          end
+          ##
+          # @private Returns the Google API client library version of this job.
+          #
+          # @return [<Google::Apis::BigqueryV2::Job>] (See
+          #   {Google::Apis::BigqueryV2::Job})
+          def to_gapi
+            @gapi
+          end
+        end
       end
     end
   end

data/lib/google/cloud/bigquery/job.rb CHANGED

@@ -90,6 +90,17 @@ module Google
           @gapi.job_reference.project_id
         end
+        ##
+        # The geographic location where the job runs.
+        #
+        # @return [String]  A geographic location, such as "US", "EU" or
+        #   "asia-northeast1".
+        #
+        # @!group Attributes
+        def location
+          @gapi.job_reference.location
+        end
         ##
         # The email address of the user who ran the job.
         #
@@ -293,7 +304,7 @@ module Google
         #
         def cancel
           ensure_service!
-          resp = service.cancel_job job_id
+          resp = service.cancel_job job_id, location: location
           @gapi = resp.job
           true
         end
@@ -316,7 +327,7 @@ module Google
         #
         def rerun!
           ensure_service!
-          gapi = service.insert_job @gapi.configuration
+          gapi = service.insert_job @gapi.configuration, location: location
           Job.from_gapi gapi, service
         end
@@ -339,7 +350,7 @@ module Google
         #
         def reload!
           ensure_service!
-          gapi = service.get_job job_id
+          gapi = service.get_job job_id, location: location
           @gapi = gapi
         end
         alias refresh! reload!

data/lib/google/cloud/bigquery/load_job.rb CHANGED

@@ -14,6 +14,7 @@
 require "google/cloud/bigquery/service"
+require "google/cloud/bigquery/encryption_configuration"
 module Google
   module Cloud
@@ -303,6 +304,19 @@ module Google
           nil
         end
+        ##
+        # The encryption configuration of the destination table.
+        #
+        # @return [Google::Cloud::Bigquery::EncryptionConfiguration] Custom
+        #   encryption configuration (e.g., Cloud KMS keys).
+        #
+        # @!group Attributes
+        def encryption
+          EncryptionConfiguration.from_gapi(
+            @gapi.configuration.load.destination_encryption_configuration
+          )
+        end
         ##
         # The number of bytes that have been loaded into the table. While an
         # import job is in the running state, this value may change.
@@ -314,6 +328,762 @@ module Google
         rescue StandardError
           nil
         end
+        ##
+        # Yielded to a block to accumulate changes for a patch request.
+        class Updater < LoadJob
+          ##
+          # A list of attributes that were updated.
+          attr_reader :updates
+          ##
+          # @private Create an Updater object.
+          def initialize gapi
+            @updates = []
+            @gapi = gapi
+            @schema = nil
+          end
+          ##
+          # Returns the table's schema. This method can also be used to set,
+          # replace, or add to the schema by passing a block. See {Schema} for
+          # available methods.
+          #
+          # @param [Boolean] replace Whether to replace the existing schema with
+          #   the new schema. If `true`, the fields will replace the existing
+          #   schema. If `false`, the fields will be added to the existing
+          #   schema. When a table already contains data, schema changes must be
+          #   additive. Thus, the default value is `false`.
+          # @yield [schema] a block for setting the schema
+          # @yieldparam [Schema] schema the object accepting the schema
+          #
+          # @return [Google::Cloud::Bigquery::Schema]
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |j|
+          #     j.schema do |s|
+          #       s.string "first_name", mode: :required
+          #       s.record "cities_lived", mode: :repeated do |r|
+          #         r.string "place", mode: :required
+          #         r.integer "number_of_years", mode: :required
+          #       end
+          #     end
+          #   end
+          #
+          # @!group Schema
+          #
+          def schema replace: false
+            # Same as Table#schema, but not frozen
+            # TODO: make sure to call ensure_full_data! on Dataset#update
+            @schema ||= Schema.from_gapi @gapi.configuration.load.schema
+            if block_given?
+              @schema = Schema.from_gapi if replace
+              yield @schema
+              check_for_mutated_schema!
+            end
+            # Do not freeze on updater, allow modifications
+            @schema
+          end
+          ##
+          # Sets the schema of the destination table.
+          #
+          # @param [Google::Cloud::Bigquery::Schema] new_schema The schema for
+          #   the destination table. Optional. The schema can be omitted if the
+          #   destination table already exists, or if you're loading data from a
+          #   source that includes a schema, such as Avro or a Google Cloud
+          #   Datastore backup.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   schema = bigquery.schema do |s|
+          #     s.string "first_name", mode: :required
+          #     s.record "cities_lived", mode: :repeated do |nested_schema|
+          #       nested_schema.string "place", mode: :required
+          #       nested_schema.integer "number_of_years", mode: :required
+          #     end
+          #   end
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |j|
+          #     j.schema = schema
+          #   end
+          #
+          # @!group Schema
+          #
+          def schema= new_schema
+            # Only the local reference is replaced here; nothing in this method
+            # writes the schema to @gapi (compare #check_for_mutated_schema!).
+            @schema = new_schema
+          end
+          ##
+          # Adds a string field to the schema.
+          #
+          # See {Schema#string}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.string "first_name", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def string name, description: nil, mode: :nullable
+            schema.string name, description: description, mode: mode
+          end
+          ##
+          # Adds an integer field to the schema.
+          #
+          # See {Schema#integer}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.integer "age", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def integer name, description: nil, mode: :nullable
+            schema.integer name, description: description, mode: mode
+          end
+          ##
+          # Adds a floating-point number field to the schema.
+          #
+          # See {Schema#float}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.float "price", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def float name, description: nil, mode: :nullable
+            schema.float name, description: description, mode: mode
+          end
+          ##
+          # Adds a boolean field to the schema.
+          #
+          # See {Schema#boolean}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.boolean "active", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def boolean name, description: nil, mode: :nullable
+            schema.boolean name, description: description, mode: mode
+          end
+          ##
+          # Adds a bytes field to the schema.
+          #
+          # See {Schema#bytes}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.bytes "avatar", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def bytes name, description: nil, mode: :nullable
+            schema.bytes name, description: description, mode: mode
+          end
+          ##
+          # Adds a timestamp field to the schema.
+          #
+          # See {Schema#timestamp}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.timestamp "creation_date", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def timestamp name, description: nil, mode: :nullable
+            schema.timestamp name, description: description, mode: mode
+          end
+          ##
+          # Adds a time field to the schema.
+          #
+          # See {Schema#time}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.time "duration", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def time name, description: nil, mode: :nullable
+            schema.time name, description: description, mode: mode
+          end
+          ##
+          # Adds a datetime field to the schema.
+          #
+          # See {Schema#datetime}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.datetime "target_end", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def datetime name, description: nil, mode: :nullable
+            schema.datetime name, description: description, mode: mode
+          end
+          ##
+          # Adds a date field to the schema.
+          #
+          # See {Schema#date}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.date "birthday", mode: :required
+          #   end
+          #
+          # @!group Schema
+          def date name, description: nil, mode: :nullable
+            schema.date name, description: description, mode: mode
+          end
+          ##
+          # Adds a record field to the schema. A block must be passed describing
+          # the nested fields of the record. For more information about nested
+          # and repeated records, see [Preparing Data for BigQuery
+          # ](https://cloud.google.com/bigquery/preparing-data-for-bigquery).
+          #
+          # See {Schema#record}.
+          #
+          # @param [String] name The field name. The name must contain only
+          #   letters (a-z, A-Z), numbers (0-9), or underscores (_), and must
+          #   start with a letter or underscore. The maximum length is 128
+          #   characters.
+          # @param [String] description A description of the field.
+          # @param [Symbol] mode The field's mode. The possible values are
+          #   `:nullable`, `:required`, and `:repeated`. The default value is
+          #   `:nullable`.
+          # @yield [nested_schema] a block for setting the nested schema
+          # @yieldparam [Schema] nested_schema the object accepting the
+          #   nested schema
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |schema|
+          #     schema.record "cities_lived", mode: :repeated do |cities_lived|
+          #       cities_lived.string "place", mode: :required
+          #       cities_lived.integer "number_of_years", mode: :required
+          #     end
+          #   end
+          #
+          # @!group Schema
+          #
+          def record name, description: nil, mode: nil, &block
+            schema.record name, description: description, mode: mode, &block
+          end
+          ##
+          # Make sure any schema changes are saved
+          def check_for_mutated_schema!
+            return if @schema.nil?
+            return unless @schema.changed?
+            @gapi.configuration.load.schema = @schema.to_gapi
+            patch_gapi! :schema
+          end
+          ##
+          # Sets the geographic location where the job should run. Required
+          # except for US and EU.
+          #
+          # @param [String] value  A geographic location, such as "US", "EU" or
+          #   "asia-northeast1". Required except for US and EU.
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |j|
+          #     j.schema do |s|
+          #       s.string "first_name", mode: :required
+          #       s.record "cities_lived", mode: :repeated do |r|
+          #         r.string "place", mode: :required
+          #         r.integer "number_of_years", mode: :required
+          #       end
+          #     end
+          #     j.location = "EU"
+          #   end
+          #
+          # @!group Attributes
+          def location= value
+            @gapi.job_reference.location = value
+          end
+          ##
+          # Sets the source file format. The default value is `csv`.
+          #
+          # The following values are supported:
+          #
+          # * `csv` - CSV
+          # * `json` - [Newline-delimited JSON](http://jsonlines.org/)
+          # * `avro` - [Avro](http://avro.apache.org/)
+          # * `datastore_backup` - Cloud Datastore backup
+          #
+          # @param [String] new_format The new source format.
+          #
+          # @!group Attributes
+          #
+          def format= new_format
+            @gapi.configuration.load.update! source_format:
+              Convert.source_format(new_format)
+          end
+          ##
+          # Sets the create disposition.
+          #
+          # This specifies whether the job is allowed to create new tables. The
+          # default value is `needed`.
+          #
+          # The following values are supported:
+          #
+          # * `needed` - Create the table if it does not exist.
+          # * `never` - The table must already exist. A 'notFound' error is
+          #             raised if the table does not exist.
+          #
+          # @param [String] new_create The new create disposition.
+          #
+          # @!group Attributes
+          #
+          def create= new_create
+            @gapi.configuration.load.update! create_disposition:
+              Convert.create_disposition(new_create)
+          end
+          ##
+          # Sets the write disposition.
+          #
+          # This specifies how to handle data already present in the table. The
+          # default value is `append`.
+          #
+          # The following values are supported:
+          #
+          # * `truncate` - BigQuery overwrites the table data.
+          # * `append` - BigQuery appends the data to the table.
+          # * `empty` - An error will be returned if the table already contains
+          #   data.
+          #
+          # @param [String] new_write The new write disposition.
+          #
+          # @!group Attributes
+          #
+          def write= new_write
+            @gapi.configuration.load.update! write_disposition:
+              Convert.write_disposition(new_write)
+          end
+          ##
+          # Sets the projection fields.
+          #
+          # If the `format` option is set to `datastore_backup`, indicates
+          # which entity properties to load from a Cloud Datastore backup.
+          # Property names are case sensitive and must be top-level properties.
+          # If not set, BigQuery loads all properties. If any named property
+          # isn't found in the Cloud Datastore backup, an invalid error is
+          # returned.
+          #
+          # @param [Array<String>] new_fields The new projection fields.
+          #
+          # @!group Attributes
+          #
+          def projection_fields= new_fields
+            if new_fields.nil?
+              @gapi.configuration.load.update! projection_fields: nil
+            else
+              @gapi.configuration.load.update! projection_fields:
+                Array(new_fields)
+            end
+          end
+          ##
+          # Sets the source URIs to load.
+          #
+          # The fully-qualified URIs that point to your data in Google Cloud.
+          #
+          # * For Google Cloud Storage URIs: Each URI can contain one '*'
+          #   wildcard character and it must come after the 'bucket' name. Size
+          #   limits related to load jobs apply to external data sources.
+          # * For Google Cloud Bigtable URIs: Exactly one URI can be specified
+          #   and it has to be a fully specified and valid HTTPS URL for a
+          #   Google Cloud Bigtable table.
+          # * For Google Cloud Datastore backups: Exactly one URI can be
+          #   specified. Also, the '*' wildcard character is not allowed.
+          #
+          # @param [Array<String>] new_uris The new source URIs to load.
+          #
+          # @!group Attributes
+          #
+          def source_uris= new_uris
+            if new_uris.nil?
+              @gapi.configuration.load.update! source_uris: nil
+            else
+              @gapi.configuration.load.update! source_uris: Array(new_uris)
+            end
+          end
+          ##
+          # Sets flag for allowing jagged rows.
+          #
+          # Accept rows that are missing trailing optional columns. The missing
+          # values are treated as nulls. If `false`, records with missing
+          # trailing columns are treated as bad records, and if there are too
+          # many bad records, an invalid error is returned in the job result.
+          # The default value is `false`. Only applicable to CSV, ignored for
+          # other formats.
+          #
+          # @param [Boolean] val Accept rows that are missing trailing optional
+          #   columns.
+          #
+          # @!group Attributes
+          #
+          def jagged_rows= val
+            @gapi.configuration.load.update! allow_jagged_rows: val
+          end
+          ##
+          # Allows quoted data sections to contain newline characters in CSV.
+          #
+          # @param [Boolean] val Indicates if BigQuery should allow quoted data
+          #   sections that contain newline characters in a CSV file. The
+          #   default value is `false`.
+          #
+          # @!group Attributes
+          #
+          def quoted_newlines= val
+            @gapi.configuration.load.update! allow_quoted_newlines: val
+          end
+          ##
+          # Allows BigQuery to autodetect the schema.
+          #
+          # @param [Boolean] val Indicates if BigQuery should automatically
+          #   infer the options and schema for CSV and JSON sources. The default
+          #   value is `false`.
+          #
+          # @!group Attributes
+          #
+          def autodetect= val
+            @gapi.configuration.load.update! autodetect: val
+          end
+          ##
+          # Sets the character encoding of the data.
+          #
+          # @param [String] val The character encoding of the data. The
+          #   supported values are `UTF-8` or `ISO-8859-1`. The default value
+          #   is `UTF-8`.
+          #
+          # @!group Attributes
+          #
+          def encoding= val
+            @gapi.configuration.load.update! encoding: val
+          end
+          ##
+          # Sets the separator for fields in a CSV file.
+          #
+          # @param [String] val Specifies the separator for fields in a CSV
+          #   file. BigQuery converts the string to `ISO-8859-1` encoding, and
+          #   then uses the first byte of the encoded string to split the data
+          #   in its raw, binary state. Default is <code>,</code>.
+          #
+          # @!group Attributes
+          #
+          def delimiter= val
+            @gapi.configuration.load.update! field_delimiter: val
+          end
+          ##
+          # Allows unknown columns to be ignored.
+          #
+          # @param [Boolean] val Indicates if BigQuery should allow extra
+          #   values that are not represented in the table schema. If true, the
+          #   extra values are ignored. If false, records with extra columns are
+          #   treated as bad records, and if there are too many bad records, an
+          #   invalid error is returned in the job result. The default value is
+          #   `false`.
+          #
+          #   The `format` property determines what BigQuery treats as an extra
+          #   value:
+          #
+          #   * `CSV`: Trailing columns
+          #   * `JSON`: Named values that don't match any column names
+          #
+          # @!group Attributes
+          #
+          def ignore_unknown= val
+            @gapi.configuration.load.update! ignore_unknown_values: val
+          end
+          ##
+          # Sets the maximum number of bad records that can be ignored.
+          #
+          # @param [Integer] val The maximum number of bad records that
+          #   BigQuery can ignore when running the job. If the number of bad
+          #   records exceeds this value, an invalid error is returned in the
+          #   job result. The default value is `0`, which requires that all
+          #   records are valid.
+          #
+          # @!group Attributes
+          #
+          def max_bad_records= val
+            @gapi.configuration.load.update! max_bad_records: val
+          end
+          ##
+          # Sets the string that represents a null value in a CSV file.
+          #
+          # @param [String] val Specifies a string that represents a null value
+          #   in a CSV file. For example, if you specify `\N`, BigQuery
+          #   interprets `\N` as a null value when loading a CSV file. The
+          #   default value is the empty string. If you set this property to a
+          #   custom value, BigQuery throws an error if an empty string is
+          #   present for all data types except for STRING and BYTE. For STRING
+          #   and BYTE columns, BigQuery interprets the empty string as an empty
+          #   value.
+          #
+          # @!group Attributes
+          #
+          def null_marker= val
+            @gapi.configuration.load.update! null_marker: val
+          end
+          ##
+          # Sets the character to use to quote string values in CSVs.
+          #
+          # @param [String] val The value that is used to quote data sections
+          #   in a CSV file. BigQuery converts the string to ISO-8859-1
+          #   encoding, and then uses the first byte of the encoded string to
+          #   split the data in its raw, binary state. The default value is a
+          #   double-quote <code>"</code>. If your data does not contain quoted
+          #   sections, set the property value to an empty string. If your data
+          #   contains quoted newline characters, you must also set the
+          #   allowQuotedNewlines property to true.
+          #
+          # @!group Attributes
+          #
+          def quote= val
+            @gapi.configuration.load.update! quote: val
+          end
+          ##
+          # Sets the number of leading rows to skip in the file.
+          #
+          # @param [Integer] val The number of rows at the top of a CSV file
+          #   that BigQuery will skip when loading the data. The default
+          #   value is `0`. This property is useful if you have header rows in
+          #   the file that should be skipped.
+          #
+          # @!group Attributes
+          #
+          def skip_leading= val
+            @gapi.configuration.load.update! skip_leading_rows: val
+          end
+          ##
+          # Sets the encryption configuration of the destination table.
+          #
+          # @param [Google::Cloud::Bigquery::EncryptionConfiguration] val
+          #   Custom encryption configuration (e.g., Cloud KMS keys).
+          #
+          # @example
+          #   require "google/cloud/bigquery"
+          #
+          #   bigquery = Google::Cloud::Bigquery.new
+          #   dataset = bigquery.dataset "my_dataset"
+          #
+          #   key_name = "projects/a/locations/b/keyRings/c/cryptoKeys/d"
+          #   encrypt_config = bigquery.encryption kms_key: key_name
+          #   job = dataset.load_job "my_table", "gs://abc/file" do |job|
+          #     job.encryption = encrypt_config
+          #   end
+          #
+          # @!group Attributes
+          def encryption= val
+            @gapi.configuration.load.update!(
+              destination_encryption_configuration: val.to_gapi
+            )
+          end
+          ##
+          # Sets the labels to use for the load job.
+          #
+          # @param [Hash] val A hash of user-provided labels associated with
+          #   the job. You can use these to organize and group your jobs. Label
+          #   keys and values can be no longer than 63 characters, can only
+          #   contain lowercase letters, numeric characters, underscores and
+          #   dashes. International characters are allowed. Label values are
+          #   optional. Label keys must start with a letter and each label in
+          #   the list must have a different key.
+          #
+          # @!group Attributes
+          #
+          def labels= val
+            @gapi.configuration.update! labels: val
+          end
+          ##
+          # @private Returns the Google API client library version of this job.
+          #
+          # @return [<Google::Apis::BigqueryV2::Job>] (See
+          #   {Google::Apis::BigqueryV2::Job})
+          def to_gapi
+            check_for_mutated_schema! # runs before the gapi is handed out
+            @gapi
+          end
+          protected
+          ##
+          # Change to a NOOP
+          def ensure_full_data!
+            # Intentionally empty: the gapi is trusted to be full already.
+          end
+          ##
+          # Queue up all the updates instead of making them.
+          def patch_gapi! attribute
+            @updates << attribute
+            @updates.uniq!
+          end
+        end
       end
     end
   end