Class: Gcloud::Bigquery::Connection

Inherits:
Object
  • Object
show all
Defined in:
lib/gcloud/bigquery/connection.rb

Overview

Represents the connection to BigQuery, as well as exposes the API calls.

Constant Summary collapse

API_VERSION =
"v2"

Instance Attribute Summary collapse

Class Method Summary collapse

Instance Method Summary collapse

Constructor Details

#initialize(project, credentials) ⇒ Connection

Creates a new Connection instance.



35
36
37
38
39
40
41
42
# File 'lib/gcloud/bigquery/connection.rb', line 35

##
# Creates a new Connection for +project+, building an authorized
# Google API client and discovering the BigQuery API surface.
#
# project     - identifier of the project used for all API calls.
# credentials - object exposing +client+, the OAuth authorization
#               installed on the API client.
def initialize project, credentials
  @credentials = credentials
  @project = project
  @client = Google::APIClient.new(
    application_name:    "gcloud-ruby",
    application_version: Gcloud::VERSION)
  @client.authorization = @credentials.client
  # Cache the discovered BigQuery API for use by the request methods.
  @bigquery = @client.discovered_api("bigquery", API_VERSION)
end

Instance Attribute Details

#credentialsObject

Returns the value of attribute credentials.



31
32
33
# File 'lib/gcloud/bigquery/connection.rb', line 31

# The credentials object used to authorize the API client
# (attribute reader; set once in the constructor).
def credentials
  @credentials
end

#projectObject

Returns the value of attribute project.



30
31
32
# File 'lib/gcloud/bigquery/connection.rb', line 30

# The project identifier sent with every API request
# (attribute reader; set once in the constructor).
def project
  @project
end

Class Method Details

.table_ref_from_s(str, default_table_ref) ⇒ Object

Extracts at least tbl group, and possibly dts and prj groups, from strings in the formats: “my_table”, “my_dataset.my_table”, or “my-project:my_dataset.my_table”. Then merges project_id and dataset_id from the default table if they are missing.



330
331
332
333
334
335
336
337
338
339
340
# File 'lib/gcloud/bigquery/connection.rb', line 330

##
# Parses a table path in one of the formats "my_table",
# "my_dataset.my_table" or "my-project:my_dataset.my_table" into a
# table reference hash, filling any missing "projectId"/"datasetId"
# entries from +default_table_ref+.
#
# Raises ArgumentError when the string cannot be matched.
def self.table_ref_from_s str, default_table_ref
  text = str.to_s
  match = /\A(((?<prj>\S*):)?(?<dts>\S*)\.)?(?<tbl>\S*)\z/.match text
  if match.nil?
    fail ArgumentError, "unable to identify table from #{text.inspect}"
  end
  parsed = {}
  parsed["projectId"] = match["prj"] unless match["prj"].nil?
  parsed["datasetId"] = match["dts"] unless match["dts"].nil?
  parsed["tableId"]   = match["tbl"] unless match["tbl"].nil?
  default_table_ref.merge parsed
end

Instance Method Details

#copy_table(source, target, options = {}) ⇒ Object



258
259
260
261
262
263
264
# File 'lib/gcloud/bigquery/connection.rb', line 258

##
# Starts a copy job from +source+ into +target+ via jobs.insert.
# The job configuration is built by copy_table_config (defined
# elsewhere in this file).
def copy_table source, target, options = {}
  config = copy_table_config source, target, options
  execute api_method:  @bigquery.jobs.insert,
          parameters:  { projectId: @project },
          body_object: config
end

#default_access_rulesObject



316
317
318
319
320
321
322
323
# File 'lib/gcloud/bigquery/connection.rb', line 316

##
# The baseline access rules applied to datasets: the standard project
# special groups plus an OWNER grant for the issuer identity of this
# connection's credentials.
def default_access_rules
  owner = credentials.issuer
  [
    { "role" => "OWNER",  "specialGroup" => "projectOwners" },
    { "role" => "WRITER", "specialGroup" => "projectWriters" },
    { "role" => "READER", "specialGroup" => "projectReaders" },
    { "role" => "OWNER",  "userByEmail"  => owner }
  ]
end

#delete_dataset(dataset_id, force = nil) ⇒ Object

Deletes the dataset specified by the datasetId value. Before you can delete a dataset, you must delete all its tables, either manually or by specifying force: true in options. Immediately after deletion, you can create another dataset with the same name.



98
99
100
101
102
103
104
105
# File 'lib/gcloud/bigquery/connection.rb', line 98

##
# Deletes the dataset. Pass +force+ as true to also delete contained
# tables (sent as deleteContents); a nil +force+ is omitted from the
# request entirely.
def delete_dataset dataset_id, force = nil
  params = { projectId: @project,
             datasetId: dataset_id,
             deleteContents: force }.reject { |_, value| value.nil? }
  execute api_method: @bigquery.datasets.delete,
          parameters: params
end

#delete_table(dataset_id, table_id) ⇒ Object

Deletes the table specified by tableId from the dataset. If the table contains data, all the data will be deleted.



165
166
167
168
169
170
171
# File 'lib/gcloud/bigquery/connection.rb', line 165

##
# Deletes the given table (and any data it contains) from the dataset.
def delete_table dataset_id, table_id
  params = { projectId: @project,
             datasetId: dataset_id,
             tableId:   table_id }
  execute api_method: @bigquery.tables.delete, parameters: params
end

#extract_table(table, storage_files, options = {}) ⇒ Object



274
275
276
277
278
279
280
# File 'lib/gcloud/bigquery/connection.rb', line 274

##
# Starts an extract job writing +table+ out to +storage_files+.
# The job configuration is built by extract_table_config (defined
# elsewhere in this file).
def extract_table table, storage_files, options = {}
  config = extract_table_config table, storage_files, options
  execute api_method:  @bigquery.jobs.insert,
          parameters:  { projectId: @project },
          body_object: config
end

#get_dataset(dataset_id) ⇒ Object

Returns the dataset specified by datasetID.



62
63
64
65
66
67
# File 'lib/gcloud/bigquery/connection.rb', line 62

##
# Fetches the dataset resource identified by +dataset_id+.
def get_dataset dataset_id
  execute api_method: @bigquery.datasets.get,
          parameters: { projectId: @project, datasetId: dataset_id }
end

#get_job(job_id) ⇒ Object

Returns the job specified by jobID.



211
212
213
214
215
216
# File 'lib/gcloud/bigquery/connection.rb', line 211

##
# Fetches the job resource identified by +job_id+.
def get_job job_id
  execute api_method: @bigquery.jobs.get,
          parameters: { projectId: @project, jobId: job_id }
end

#get_project_table(project_id, dataset_id, table_id) ⇒ Object



123
124
125
126
127
128
129
# File 'lib/gcloud/bigquery/connection.rb', line 123

##
# Fetches a table resource from an arbitrary project (not necessarily
# this connection's own project).
def get_project_table project_id, dataset_id, table_id
  params = { projectId: project_id,
             datasetId: dataset_id,
             tableId:   table_id }
  execute api_method: @bigquery.tables.get, parameters: params
end

#get_table(dataset_id, table_id) ⇒ Object

Gets the specified table resource by table ID. This method does not return the data in the table, it only returns the table resource, which describes the structure of this table.



136
137
138
# File 'lib/gcloud/bigquery/connection.rb', line 136

##
# Fetches the table resource (structure only, not row data) from this
# connection's own project by delegating to #get_project_table.
def get_table dataset_id, table_id
  get_project_table(@project, dataset_id, table_id)
end

#insert_dataset(dataset_id, options = {}) ⇒ Object

Creates a new empty dataset.



71
72
73
74
75
76
77
# File 'lib/gcloud/bigquery/connection.rb', line 71

##
# Creates a new empty dataset. The request body is built by
# insert_dataset_request (defined elsewhere in this file).
def insert_dataset dataset_id, options = {}
  body = insert_dataset_request dataset_id, options
  execute api_method:  @bigquery.datasets.insert,
          parameters:  { projectId: @project },
          body_object: body
end

#insert_job(config) ⇒ Object



218
219
220
221
222
223
224
# File 'lib/gcloud/bigquery/connection.rb', line 218

##
# Submits an arbitrary job with the supplied configuration hash,
# wrapped under the "configuration" key the API expects.
def insert_job config
  execute api_method:  @bigquery.jobs.insert,
          parameters:  { projectId: @project },
          body_object: { "configuration" => config }
end

#insert_table(dataset_id, table_id, options = {}) ⇒ Object

Creates a new, empty table in the dataset.



142
143
144
145
146
147
148
# File 'lib/gcloud/bigquery/connection.rb', line 142

##
# Creates a new, empty table in the dataset. The request body is
# built by insert_table_request (defined elsewhere in this file).
def insert_table dataset_id, table_id, options = {}
  body = insert_table_request dataset_id, table_id, options
  execute api_method:  @bigquery.tables.insert,
          parameters:  { projectId: @project, datasetId: dataset_id },
          body_object: body
end

#insert_tabledata(dataset_id, table_id, rows, options = {}) ⇒ Object



189
190
191
192
193
194
195
196
197
# File 'lib/gcloud/bigquery/connection.rb', line 189

##
# Streams +rows+ into the table via tabledata.insertAll. The row
# payload is built by insert_tabledata_rows (defined elsewhere in
# this file).
def insert_tabledata dataset_id, table_id, rows, options = {}
  params = { projectId: @project,
             datasetId: dataset_id,
             tableId:   table_id }
  execute api_method:  @bigquery.tabledata.insert_all,
          parameters:  params,
          body_object: insert_tabledata_rows(rows, options)
end

#inspectObject



342
343
344
# File 'lib/gcloud/bigquery/connection.rb', line 342

##
# A terse description of the connection: the class name followed by
# the project identifier in parentheses.
def inspect
  format "%s(%s)", self.class, @project
end

#job_query_results(job_id, options = {}) ⇒ Object

Returns the query data for the job



244
245
246
247
248
249
250
251
252
253
254
255
256
# File 'lib/gcloud/bigquery/connection.rb', line 244

##
# Fetches the query results for a job. Recognized options (:token,
# :max, :start, :timeout) are removed from the options hash and
# mapped to API parameters; nil values are dropped from the request.
def job_query_results job_id, options = {}
  params = { projectId:  @project,
             jobId:      job_id,
             pageToken:  options.delete(:token),
             maxResults: options.delete(:max),
             startIndex: options.delete(:start),
             timeoutMs:  options.delete(:timeout) }
  params.reject! { |_, value| value.nil? }

  execute api_method: @bigquery.jobs.get_query_results,
          parameters: params
end

#link_table(table, urls, options = {}) ⇒ Object
266
267
268
269
270
271
272
# File 'lib/gcloud/bigquery/connection.rb', line 266

##
# Starts a link job attaching +urls+ to +table+. The job
# configuration is built by link_table_config (defined elsewhere in
# this file).
def link_table table, urls, options = {}
  config = link_table_config table, urls, options
  execute api_method:  @bigquery.jobs.insert,
          parameters:  { projectId: @project },
          body_object: config
end

#list_datasets(options = {}) ⇒ Object

Lists all datasets in the specified project to which you have been granted the READER dataset role.



47
48
49
50
51
52
53
54
55
56
57
58
# File 'lib/gcloud/bigquery/connection.rb', line 47

##
# Lists datasets in the project. Recognized options (:all, :token,
# :max) are removed from the options hash and mapped to API
# parameters; nil values are dropped from the request.
def list_datasets options = {}
  params = { projectId:  @project,
             all:        options.delete(:all),
             pageToken:  options.delete(:token),
             maxResults: options.delete(:max) }
  params.reject! { |_, value| value.nil? }

  execute api_method: @bigquery.datasets.list, parameters: params
end

#list_jobs(options = {}) ⇒ Object

Lists all jobs in the specified project to which you have been granted the READER job role.



202
203
204
205
206
207
# File 'lib/gcloud/bigquery/connection.rb', line 202

##
# Lists jobs in the project. Request parameters are assembled by
# list_jobs_params (defined elsewhere in this file).
def list_jobs options = {}
  execute api_method: @bigquery.jobs.list,
          parameters: list_jobs_params(options)
end

#list_tabledata(dataset_id, table_id, options = {}) ⇒ Object

Retrieves data from the table.



175
176
177
178
179
180
181
182
183
184
185
186
187
# File 'lib/gcloud/bigquery/connection.rb', line 175

##
# Reads rows from the table. Recognized options (:token, :max,
# :start) are removed from the options hash and mapped to API
# parameters; nil values are dropped from the request.
def list_tabledata dataset_id, table_id, options = {}
  params = { projectId:  @project,
             datasetId:  dataset_id,
             tableId:    table_id,
             pageToken:  options.delete(:token),
             maxResults: options.delete(:max),
             startIndex: options.delete(:start) }
  params.reject! { |_, value| value.nil? }

  execute api_method: @bigquery.tabledata.list, parameters: params
end

#list_tables(dataset_id, options = {}) ⇒ Object

Lists all tables in the specified dataset. Requires the READER dataset role.



110
111
112
113
114
115
116
117
118
119
120
121
# File 'lib/gcloud/bigquery/connection.rb', line 110

##
# Lists tables in the dataset. Recognized options (:token, :max) are
# removed from the options hash and mapped to API parameters; nil
# values are dropped from the request.
def list_tables dataset_id, options = {}
  params = { projectId:  @project,
             datasetId:  dataset_id,
             pageToken:  options.delete(:token),
             maxResults: options.delete(:max) }
  params.reject! { |_, value| value.nil? }

  execute api_method: @bigquery.tables.list, parameters: params
end

#load_multipart(table, file, options = {}) ⇒ Object



291
292
293
294
295
296
297
298
299
300
# File 'lib/gcloud/bigquery/connection.rb', line 291

##
# Loads a local +file+ into +table+ with a single multipart upload.
# Media wrapping and job configuration come from load_media and
# load_table_config (defined elsewhere in this file).
def load_multipart table, file, options = {}
  upload = load_media file

  execute api_method:  @bigquery.jobs.insert,
          media:       upload,
          parameters:  { projectId: @project, uploadType: "multipart" },
          body_object: load_table_config(table, nil, file, options)
end

#load_resumable(table, file, chunk_size = nil, options = {}) ⇒ Object



302
303
304
305
306
307
308
309
310
311
312
313
314
# File 'lib/gcloud/bigquery/connection.rb', line 302

##
# Loads a local +file+ into +table+ using the resumable-upload
# protocol, chunked by +chunk_size+ when given. After the initial
# insert, keeps re-executing the resumable upload until it reports it
# is no longer resumable, returning the final result.
def load_resumable table, file, chunk_size = nil, options = {}
  media = load_media file, chunk_size

  result = execute(
    api_method: @bigquery.jobs.insert,
    media: media,
    parameters: { projectId: @project, uploadType: "resumable" },
    body_object: load_table_config(table, nil, file, options)
  )
  upload = result.resumable_upload
  while upload.resumable?
    result = execute upload
  end
  result
end

#load_table(table, storage_url, options = {}) ⇒ Object



282
283
284
285
286
287
288
289
# File 'lib/gcloud/bigquery/connection.rb', line 282

##
# Starts a load job pulling data into +table+ from Cloud Storage.
# NOTE(review): load_table_config receives both the raw storage_url
# and the first element of Array(storage_url) — confirm that this
# duplication is intended by the helper's signature.
def load_table table, storage_url, options = {}
  config = load_table_config(table, storage_url,
                             Array(storage_url).first, options)
  execute api_method:  @bigquery.jobs.insert,
          parameters:  { projectId: @project },
          body_object: config
end

#patch_dataset(dataset_id, options = {}) ⇒ Object

Updates information in an existing dataset, only replacing fields that are provided in the submitted dataset resource.



82
83
84
85
86
87
88
89
90
# File 'lib/gcloud/bigquery/connection.rb', line 82

##
# Patches an existing dataset, replacing only the fields supplied in
# +options+. An optional :project_id entry overrides the connection's
# own project. The request body is built by patch_dataset_request
# (defined elsewhere in this file).
def patch_dataset dataset_id, options = {}
  project_id = options[:project_id] || @project

  execute api_method:  @bigquery.datasets.patch,
          parameters:  { projectId: project_id, datasetId: dataset_id },
          body_object: patch_dataset_request(options)
end

#patch_table(dataset_id, table_id, options = {}) ⇒ Object

Updates information in an existing table, replacing fields that are provided in the submitted table resource.



153
154
155
156
157
158
159
160
# File 'lib/gcloud/bigquery/connection.rb', line 153

##
# Patches an existing table, replacing only the fields supplied in
# +options+. The request body is built by patch_table_request
# (defined elsewhere in this file).
def patch_table dataset_id, table_id, options = {}
  params = { projectId: @project,
             datasetId: dataset_id,
             tableId:   table_id }
  execute api_method:  @bigquery.tables.patch,
          parameters:  params,
          body_object: patch_table_request(options)
end

#query(query, options = {}) ⇒ Object



234
235
236
237
238
239
240
# File 'lib/gcloud/bigquery/connection.rb', line 234

##
# Runs a synchronous query via jobs.query. The request body is built
# by query_config (defined elsewhere in this file).
def query query, options = {}
  body = query_config query, options
  execute api_method:  @bigquery.jobs.query,
          parameters:  { projectId: @project },
          body_object: body
end

#query_job(query, options = {}) ⇒ Object



226
227
228
229
230
231
232
# File 'lib/gcloud/bigquery/connection.rb', line 226

##
# Starts an asynchronous query job via jobs.insert. The job
# configuration is built by query_table_config (defined elsewhere in
# this file).
def query_job query, options = {}
  body = query_table_config query, options
  execute api_method:  @bigquery.jobs.insert,
          parameters:  { projectId: @project },
          body_object: body
end