Class: Gcloud::Bigquery::Service

Inherits:

Object

Object
Gcloud::Bigquery::Service

show all

Defined in: lib/gcloud/bigquery/service.rb

Constant Summary collapse

API = Alias to the Google Client API module

Google::Apis::BigqueryV2

Instance Attribute Summary collapse

#credentials ⇒ Object
#mocked_service ⇒ Object

Returns the value of attribute mocked_service.
#project ⇒ Object

Class Method Summary collapse

.table_ref_from_s(str, default_table_ref) ⇒ Object

Extracts at least the `tbl` group, and possibly the `dts` and `prj` groups, from strings in the formats: “my_table”, “my_dataset.my_table”, or “my-project:my_dataset.my_table”.

Instance Method Summary collapse

#copy_table(source, target, options = {}) ⇒ Object
#delete_dataset(dataset_id, force = nil) ⇒ Object

Deletes the dataset specified by the datasetId value.
#delete_table(dataset_id, table_id) ⇒ Object

Deletes the table specified by tableId from the dataset.
#extract_table(table, storage_files, options = {}) ⇒ Object
#get_dataset(dataset_id) ⇒ Object

Returns the dataset specified by datasetID.
#get_job(job_id) ⇒ Object

Returns the job specified by jobID.
#get_project_table(project_id, dataset_id, table_id) ⇒ Object
#get_table(dataset_id, table_id) ⇒ Object

Gets the specified table resource by table ID.
#initialize(project, credentials, retries: nil, timeout: nil) ⇒ Service constructor

Creates a new Service instance.
#insert_dataset(new_dataset_gapi) ⇒ Object

Creates a new empty dataset.
#insert_job(config) ⇒ Object
#insert_table(dataset_id, new_table_gapi) ⇒ Object

Creates a new, empty table in the dataset.
#insert_tabledata(dataset_id, table_id, rows, options = {}) ⇒ Object
#inspect ⇒ Object
#job_query_results(job_id, options = {}) ⇒ Object

Returns the query data for the job.
#list_datasets(options = {}) ⇒ Object

Lists all datasets in the specified project to which you have been granted the READER dataset role.
#list_jobs(options = {}) ⇒ Object

Lists all jobs in the specified project to which you have been granted the READER job role.
#list_tabledata(dataset_id, table_id, options = {}) ⇒ Object

Retrieves data from the table.
#list_tables(dataset_id, options = {}) ⇒ Object

Lists all tables in the specified dataset.
#load_table_file(dataset_id, table_id, file, options = {}) ⇒ Object
#load_table_gs_url(dataset_id, table_id, url, options = {}) ⇒ Object
#patch_dataset(dataset_id, patched_dataset_gapi) ⇒ Object

Updates information in an existing dataset, only replacing fields that are provided in the submitted dataset resource.
#patch_table(dataset_id, table_id, patched_table_gapi) ⇒ Object

Updates information in an existing table, replacing fields that are provided in the submitted table resource.
#query(query, options = {}) ⇒ Object
#query_job(query, options = {}) ⇒ Object
#service ⇒ Object

Constructor Details

#initialize(project, credentials, retries: nil, timeout: nil) ⇒ `Service`

Creates a new Service instance.

# File 'lib/gcloud/bigquery/service.rb', line 40

# Creates a new Service instance.
#
# Builds an API::BigqueryService client, labels it with the "gcloud-ruby"
# application name and Gcloud::VERSION, configures retry/timeout request
# options, and authorizes it with `credentials.client`.
#
# @param project [Object] project identifier, stored in @project
# @param credentials [Object] stored in @credentials; must respond to #client
# @param retries [Integer, nil] request retry count; 3 is used when not given
# @param timeout [Object, nil] assigned to request_options.timeout_sec only
#   when truthy, otherwise the client's existing value is left untouched
def initialize project, credentials, retries: nil, timeout: nil
  @project = project
  @credentials = credentials
  @service = API::BigqueryService.new
  @service.client_options.application_name    = "gcloud-ruby"
  @service.client_options.application_version = Gcloud::VERSION
  @service.request_options.retries = retries || 3
  @service.request_options.timeout_sec = timeout if timeout
  @service.authorization = @credentials.client
end

Instance Attribute Details

#credentials ⇒ `Object`



36
37
38

# File 'lib/gcloud/bigquery/service.rb', line 36

# Reader for @credentials, the credentials object handed to the constructor.
#
# @return [Object] the stored credentials
def credentials
  @credentials
end

#mocked_service ⇒ `Object`

Returns the value of attribute mocked_service.



56
57
58

# File 'lib/gcloud/bigquery/service.rb', line 56

# Returns the value of attribute mocked_service.
#
# When this value is truthy, #service returns it instead of the real client.
#
# @return [Object, nil] the stand-in service, if one has been assigned
def mocked_service
  @mocked_service
end

#project ⇒ `Object`



33
34
35

# File 'lib/gcloud/bigquery/service.rb', line 33

# Reader for @project, the project identifier handed to the constructor.
#
# @return [Object] the stored project identifier
def project
  @project
end

Class Method Details

.table_ref_from_s(str, default_table_ref) ⇒ `Object`

Extracts at least the `tbl` group, and possibly the `dts` and `prj` groups, from strings in the formats: “my_table”, “my_dataset.my_table”, or “my-project:my_dataset.my_table”. Then merges project_id and dataset_id from the default table if they are missing.

# File 'lib/gcloud/bigquery/service.rb', line 277

# Parses a table identifier string into a TableReference.
#
# Accepted shapes are "tbl", "dts.tbl" and "prj:dts.tbl". Parts that are
# absent from the string are taken from `default_table_ref`; parts that are
# present override it.
#
# @param str [#to_s] the table identifier
# @param default_table_ref [#to_h] supplies the fallback values
# @return [Google::Apis::BigqueryV2::TableReference]
# @raise [ArgumentError] when the string does not match the expected pattern
def self.table_ref_from_s(str, default_table_ref)
  text = str.to_s
  pattern = /\A(((?<prj>\S*):)?(?<dts>\S*)\.)?(?<tbl>\S*)\z/
  match = pattern.match(text)
  if match.nil?
    raise ArgumentError, "unable to identify table from #{text.inspect}"
  end

  # Keep only the groups that actually took part in the match.
  parsed = {
    project_id: match["prj"],
    dataset_id: match["dts"],
    table_id:   match["tbl"]
  }.reject { |_, value| value.nil? }

  merged = default_table_ref.to_h.merge(parsed)
  Google::Apis::BigqueryV2::TableReference.new merged
end

Instance Method Details

#copy_table(source, target, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 244

# Submits a copy job for the given source and target.
#
# The job configuration comes from copy_table_config and is passed to the
# service's insert_job together with @project.
#
# @return [Object] whatever the service's insert_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def copy_table(source, target, options = {})
  job_config = copy_table_config(source, target, options)
  service.insert_job(@project, job_config)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#delete_dataset(dataset_id, force = nil) ⇒ `Object`

Deletes the dataset specified by the datasetId value. Before you can delete a dataset, you must delete all its tables, either manually or by passing a truthy force argument (sent to the API as delete_contents). Immediately after deletion, you can create another dataset with the same name.

# File 'lib/gcloud/bigquery/service.rb', line 100

# Deletes the dataset identified by dataset_id in @project.
#
# @param dataset_id [Object] identifier of the dataset to delete
# @param force [Object, nil] forwarded to the service as `delete_contents`
# @return [Object] whatever the service's delete_dataset returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def delete_dataset(dataset_id, force = nil)
  service.delete_dataset(@project, dataset_id, delete_contents: force)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#delete_table(dataset_id, table_id) ⇒ `Object`

Deletes the table specified by tableId from the dataset. If the table contains data, all the data will be deleted.

# File 'lib/gcloud/bigquery/service.rb', line 153

# Deletes the table identified by table_id from the given dataset in
# @project.
#
# @return [Object] whatever the service's delete_table returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def delete_table(dataset_id, table_id)
  service.delete_table(@project, dataset_id, table_id)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#extract_table(table, storage_files, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 250

# Submits an extract job for the given table and storage files.
#
# The job configuration comes from extract_table_config and is passed to the
# service's insert_job together with @project.
#
# @return [Object] whatever the service's insert_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def extract_table(table, storage_files, options = {})
  extract_config = extract_table_config(table, storage_files, options)
  service.insert_job(@project, extract_config)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#get_dataset(dataset_id) ⇒ `Object`

Returns the dataset specified by datasetID.

# File 'lib/gcloud/bigquery/service.rb', line 71

# Fetches the dataset identified by dataset_id from @project.
#
# @return [Object] whatever the service's get_dataset returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def get_dataset(dataset_id)
  service.get_dataset(@project, dataset_id)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#get_job(job_id) ⇒ `Object`

Returns the job specified by jobID.

# File 'lib/gcloud/bigquery/service.rb', line 203

# Fetches the job identified by job_id from @project.
#
# @return [Object] whatever the service's get_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def get_job(job_id)
  service.get_job(@project, job_id)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#get_project_table(project_id, dataset_id, table_id) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 116

# Fetches a table resource from an explicitly named project, rather than
# from @project.
#
# @return [Object] whatever the service's get_table returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def get_project_table(project_id, dataset_id, table_id)
  service.get_table(project_id, dataset_id, table_id)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#get_table(dataset_id, table_id) ⇒ `Object`

Gets the specified table resource by table ID. This method does not return the data in the table; it only returns the table resource, which describes the structure of this table.

# File 'lib/gcloud/bigquery/service.rb', line 127

# Fetches a table resource from @project by delegating to
# get_project_table.
#
# @return [Object] whatever get_project_table returns
# @raise the result of Gcloud::Error.from_error when a Google::Apis::Error
#   reaches this method
def get_table(dataset_id, table_id)
  get_project_table(@project, dataset_id, table_id)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#insert_dataset(new_dataset_gapi) ⇒ `Object`

Creates a new empty dataset.

# File 'lib/gcloud/bigquery/service.rb', line 79

# Creates a dataset in @project from the given dataset resource.
#
# @return [Object] whatever the service's insert_dataset returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def insert_dataset(new_dataset_gapi)
  service.insert_dataset(@project, new_dataset_gapi)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#insert_job(config) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 209

# Wraps the given configuration in an API::Job and submits it to the
# service under @project.
#
# @param config [Object] used as the job's `configuration`
# @return [Object] whatever the service's insert_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def insert_job(config)
  new_job = API::Job.new(configuration: config)
  service.insert_job(@project, new_job)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#insert_table(dataset_id, new_table_gapi) ⇒ `Object`

Creates a new, empty table in the dataset.

# File 'lib/gcloud/bigquery/service.rb', line 135

# Creates a table in the given dataset of @project from the given table
# resource.
#
# @return [Object] whatever the service's insert_table returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def insert_table(dataset_id, new_table_gapi)
  service.insert_table(@project, dataset_id, new_table_gapi)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#insert_tabledata(dataset_id, table_id, rows, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 170

# Inserts rows into a table through the service's insert_all_table_data
# call.
#
# Each row is wrapped in an InsertAllTableDataRequest::Row whose insert_id
# is the Base64 MD5 digest of `row.inspect`, so rows with identical content
# get identical insert ids.
#
# @param dataset_id [Object] dataset containing the table
# @param table_id [Object] table receiving the rows
# @param rows [Array, Hash, nil] one row or a list of rows; a lone Hash is
#   treated as a single row
# @param options [Hash] `:ignore_unknown` is sent as ignore_unknown_values
#   and `:skip_invalid` as skip_invalid_rows
# @return [Object] whatever the service's insert_all_table_data returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def insert_tabledata dataset_id, table_id, rows, options = {}
  # Kernel#Array would turn a lone Hash into [key, value] pairs, so wrap a
  # single row before coercing.
  rows = [rows] if rows.is_a? Hash
  insert_rows = Array(rows).map do |row|
    Google::Apis::BigqueryV2::InsertAllTableDataRequest::Row.new(
      insert_id: Digest::MD5.base64digest(row.inspect),
      # Hash[row.map{|(k,v)| [k.to_s,v]}] for Hash<String,Object>
      json: row
    )
  end
  insert_req = Google::Apis::BigqueryV2::InsertAllTableDataRequest.new(
    rows: insert_rows,
    ignore_unknown_values: options[:ignore_unknown],
    skip_invalid_rows: options[:skip_invalid]
  )

  service.insert_all_table_data @project, dataset_id, table_id, insert_req
rescue Google::Apis::Error => e
  raise Gcloud::Error.from_error(e)
end

#inspect ⇒ `Object`



292
293
294

# File 'lib/gcloud/bigquery/service.rb', line 292

def inspect
  "#{self.class}(#{@project})"
end

#job_query_results(job_id, options = {}) ⇒ `Object`

Returns the query data for the job.

# File 'lib/gcloud/bigquery/service.rb', line 233

# Returns the query data for the job.
#
# The options hash is only read, never modified, so callers may reuse it or
# pass a frozen hash.
#
# @param job_id [Object] identifier of the job
# @param options [Hash] `:max` is sent as max_results, `:token` as
#   page_token, `:start` as start_index and `:timeout` as timeout_ms
# @return [Object] whatever the service's get_job_query_results returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def job_query_results job_id, options = {}
  service.get_job_query_results @project,
                                job_id,
                                max_results: options[:max],
                                page_token: options[:token],
                                start_index: options[:start],
                                timeout_ms: options[:timeout]
rescue Google::Apis::Error => e
  raise Gcloud::Error.from_error(e)
end

#list_datasets(options = {}) ⇒ `Object`

Lists all datasets in the specified project to which you have been granted the READER dataset role.

# File 'lib/gcloud/bigquery/service.rb', line 61

# Lists the datasets of @project.
#
# @param options [Hash] `:all` is sent as all, `:max` as max_results and
#   `:token` as page_token
# @return [Object] whatever the service's list_datasets returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def list_datasets(options = {})
  service.list_datasets(
    @project,
    all: options[:all],
    max_results: options[:max],
    page_token: options[:token]
  )
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#list_jobs(options = {}) ⇒ `Object`

Lists all jobs in the specified project to which you have been granted the READER job role.

# File 'lib/gcloud/bigquery/service.rb', line 192

# Lists the jobs of @project, always requesting the "full" projection.
#
# @param options [Hash] `:all` is sent as all_users, `:max` as max_results,
#   `:token` as page_token and `:filter` as state_filter
# @return [Object] whatever the service's list_jobs returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def list_jobs(options = {})
  service.list_jobs(
    @project,
    all_users: options[:all],
    max_results: options[:max],
    page_token: options[:token],
    projection: "full",
    state_filter: options[:filter]
  )
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#list_tabledata(dataset_id, table_id, options = {}) ⇒ `Object`

Retrieves data from the table.

# File 'lib/gcloud/bigquery/service.rb', line 161

# Retrieves data from the table.
#
# The options hash is only read, never modified, so callers may reuse it or
# pass a frozen hash.
#
# @param dataset_id [Object] dataset containing the table
# @param table_id [Object] table to read
# @param options [Hash] `:max` is sent as max_results, `:token` as
#   page_token and `:start` as start_index
# @return [Object] whatever the service's list_table_data returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def list_tabledata dataset_id, table_id, options = {}
  service.list_table_data @project, dataset_id, table_id,
                          max_results: options[:max],
                          page_token: options[:token],
                          start_index: options[:start]
rescue Google::Apis::Error => e
  raise Gcloud::Error.from_error(e)
end

#list_tables(dataset_id, options = {}) ⇒ `Object`

Lists all tables in the specified dataset. Requires the READER dataset role.

# File 'lib/gcloud/bigquery/service.rb', line 109

# Lists the tables of the given dataset in @project.
#
# @param dataset_id [Object] dataset whose tables are listed
# @param options [Hash] `:max` is sent as max_results and `:token` as
#   page_token
# @return [Object] whatever the service's list_tables returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def list_tables(dataset_id, options = {})
  service.list_tables(
    @project,
    dataset_id,
    max_results: options[:max],
    page_token: options[:token]
  )
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#load_table_file(dataset_id, table_id, file, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 264

# Submits a load job that uploads a local file.
#
# The job configuration comes from load_table_file_config. The file itself
# is passed as `upload_source`, with the content type taken from
# mime_type_for(file).
#
# @return [Object] whatever the service's insert_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def load_table_file(dataset_id, table_id, file, options = {})
  service.insert_job(
    @project,
    load_table_file_config(dataset_id, table_id, file, options),
    upload_source: file,
    content_type: mime_type_for(file)
  )
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#load_table_gs_url(dataset_id, table_id, url, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 257

# Submits a load job whose source is given by url.
#
# The job configuration comes from load_table_url_config and is passed to
# the service's insert_job together with @project.
#
# @return [Object] whatever the service's insert_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def load_table_gs_url(dataset_id, table_id, url, options = {})
  load_config = load_table_url_config(dataset_id, table_id, url, options)
  service.insert_job(@project, load_config)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#patch_dataset(dataset_id, patched_dataset_gapi) ⇒ `Object`

Updates information in an existing dataset, only replacing fields that are provided in the submitted dataset resource.

# File 'lib/gcloud/bigquery/service.rb', line 88

# Patches the dataset identified by dataset_id in @project with the given
# dataset resource.
#
# @return [Object] whatever the service's patch_dataset returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def patch_dataset(dataset_id, patched_dataset_gapi)
  service.patch_dataset(@project, dataset_id, patched_dataset_gapi)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#patch_table(dataset_id, table_id, patched_table_gapi) ⇒ `Object`

Updates information in an existing table, replacing fields that are provided in the submitted table resource.

# File 'lib/gcloud/bigquery/service.rb', line 144

# Patches the table identified by table_id in the given dataset of @project
# with the given table resource.
#
# @return [Object] whatever the service's patch_table returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def patch_table(dataset_id, table_id, patched_table_gapi)
  service.patch_table(@project, dataset_id, table_id, patched_table_gapi)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#query(query, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 225

# Runs a query through the service's query_job call.
#
# The request comes from query_config and is sent together with @project.
#
# @return [Object] whatever the service's query_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def query(query, options = {})
  request = query_config(query, options)
  service.query_job(@project, request)
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#query_job(query, options = {}) ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 218

# Submits a query as a job.
#
# The job configuration comes from query_table_config and is passed to the
# service's insert_job together with @project.
#
# @return [Object] whatever the service's insert_job returns
# @raise the result of Gcloud::Error.from_error when the service raises
#   Google::Apis::Error
def query_job(query, options = {})
  service.insert_job(@project, query_table_config(query, options))
rescue Google::Apis::Error => api_error
  raise Gcloud::Error.from_error(api_error)
end

#service ⇒ `Object`

# File 'lib/gcloud/bigquery/service.rb', line 52

# The client used for API calls: the mocked service when one has been set
# to a truthy value, otherwise the real client held in @service.
#
# @return [Object]
def service
  mocked_service || @service
end

Class: Gcloud::Bigquery::Service

Constant Summary collapse

Instance Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(project, credentials, retries: nil, timeout: nil) ⇒ Service

Instance Attribute Details

#credentials ⇒ Object

#mocked_service ⇒ Object

#project ⇒ Object

Class Method Details

.table_ref_from_s(str, default_table_ref) ⇒ Object

Instance Method Details

#copy_table(source, target, options = {}) ⇒ Object

#delete_dataset(dataset_id, force = nil) ⇒ Object

#delete_table(dataset_id, table_id) ⇒ Object

#extract_table(table, storage_files, options = {}) ⇒ Object

#get_dataset(dataset_id) ⇒ Object

#get_job(job_id) ⇒ Object

#get_project_table(project_id, dataset_id, table_id) ⇒ Object

#get_table(dataset_id, table_id) ⇒ Object

#insert_dataset(new_dataset_gapi) ⇒ Object

#insert_job(config) ⇒ Object

#insert_table(dataset_id, new_table_gapi) ⇒ Object

#insert_tabledata(dataset_id, table_id, rows, options = {}) ⇒ Object

#inspect ⇒ Object

#job_query_results(job_id, options = {}) ⇒ Object

#list_datasets(options = {}) ⇒ Object

#list_jobs(options = {}) ⇒ Object

#list_tabledata(dataset_id, table_id, options = {}) ⇒ Object

#list_tables(dataset_id, options = {}) ⇒ Object

#load_table_file(dataset_id, table_id, file, options = {}) ⇒ Object

#load_table_gs_url(dataset_id, table_id, url, options = {}) ⇒ Object

#patch_dataset(dataset_id, patched_dataset_gapi) ⇒ Object

#patch_table(dataset_id, table_id, patched_table_gapi) ⇒ Object

#query(query, options = {}) ⇒ Object

#query_job(query, options = {}) ⇒ Object

#service ⇒ Object