-
Notifications
You must be signed in to change notification settings - Fork 309
Commit
This commit does not belong to any branch on this repository, and may belong to a fork outside of the repository.
refactor(bigquery): update code samples of load table autodetect and …
…truncate (#28) Co-authored-by: Peter Lamut <plamut@users.noreply.github.com>
- Loading branch information
1 parent
da40b62
commit 18eb9e8
Showing
16 changed files
with
571 additions
and
168 deletions.
There are no files selected for viewing
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,45 @@ | ||
# Copyright 2020 Google LLC | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
|
||
def load_table_uri_autodetect_csv(table_id):
    """Load a CSV file from Cloud Storage with schema autodetection.

    Starts a load job for a fixed public sample file, waits for it to
    finish, then prints the number of rows in the destination table.

    Args:
        table_id: ID of the destination table, in the form
            "your-project.your_dataset.your_table_name".
    """

    # [START bigquery_load_table_gcs_csv_autodetect]
    from google.cloud import bigquery

    # Construct a BigQuery client object.
    client = bigquery.Client()

    # TODO(developer): Set table_id to the ID of the table to create.
    # table_id = "your-project.your_dataset.your_table_name"

    job_config = bigquery.LoadJobConfig(
        autodetect=True,
        skip_leading_rows=1,
        # The source format defaults to CSV, so the line below is optional.
        source_format=bigquery.SourceFormat.CSV,
    )
    uri = "gs://cloud-samples-data/bigquery/us-states/us-states.csv"
    load_job = client.load_table_from_uri(
        uri, table_id, job_config=job_config
    )  # Make an API request.
    load_job.result()  # Waits for the job to complete.
    destination_table = client.get_table(table_id)
    print("Loaded {} rows.".format(destination_table.num_rows))
    # [END bigquery_load_table_gcs_csv_autodetect]
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,42 @@ | ||
# Copyright 2020 Google LLC | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
|
||
def load_table_uri_autodetect_json(table_id):
    """Load a newline-delimited JSON file from Cloud Storage with autodetect.

    Starts a load job for a fixed public sample file, waits for it to
    finish, then prints the number of rows in the destination table.

    Args:
        table_id: ID of the destination table, in the form
            "your-project.your_dataset.your_table_name".
    """

    # [START bigquery_load_table_gcs_json_autodetect]
    from google.cloud import bigquery

    # Construct a BigQuery client object.
    client = bigquery.Client()

    # TODO(developer): Set table_id to the ID of the table to create.
    # table_id = "your-project.your_dataset.your_table_name"

    job_config = bigquery.LoadJobConfig(
        autodetect=True, source_format=bigquery.SourceFormat.NEWLINE_DELIMITED_JSON
    )
    uri = "gs://cloud-samples-data/bigquery/us-states/us-states.json"
    load_job = client.load_table_from_uri(
        uri, table_id, job_config=job_config
    )  # Make an API request.
    load_job.result()  # Waits for the job to complete.
    destination_table = client.get_table(table_id)
    print("Loaded {} rows.".format(destination_table.num_rows))
    # [END bigquery_load_table_gcs_json_autodetect]
This file contains bidirectional Unicode text that may be interpreted or compiled differently than what appears below. To review, open the file in an editor that reveals hidden Unicode characters.
Learn more about bidirectional Unicode characters
Original file line number | Diff line number | Diff line change |
---|---|---|
@@ -0,0 +1,55 @@ | ||
# Copyright 2020 Google LLC | ||
# | ||
# Licensed under the Apache License, Version 2.0 (the "License"); | ||
# you may not use this file except in compliance with the License. | ||
# You may obtain a copy of the License at | ||
# | ||
# http://www.apache.org/licenses/LICENSE-2.0 | ||
# | ||
# Unless required by applicable law or agreed to in writing, software | ||
# distributed under the License is distributed on an "AS IS" BASIS, | ||
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied. | ||
# See the License for the specific language governing permissions and | ||
# limitations under the License. | ||
|
||
|
||
def load_table_uri_truncate_avro(table_id):
    """Load an Avro file from Cloud Storage using WRITE_TRUNCATE.

    The table is first seeded with a single in-memory row so it is known to
    be non-empty. A second load job then loads a fixed public Avro sample
    with the WRITE_TRUNCATE write disposition, and the resulting row count
    is printed.

    Args:
        table_id: ID of the destination table, in the form
            "your-project.your_dataset.your_table_name".

    Raises:
        AssertionError: If the table has no rows after the seeding load.
    """

    # [START bigquery_load_table_gcs_avro_truncate]
    import io

    from google.cloud import bigquery

    # Construct a BigQuery client object.
    client = bigquery.Client()

    # TODO(developer): Set table_id to the ID of the table to create.
    # table_id = "your-project.your_dataset.your_table_name"

    job_config = bigquery.LoadJobConfig(
        schema=[
            bigquery.SchemaField("name", "STRING"),
            bigquery.SchemaField("post_abbr", "STRING"),
        ],
    )

    # Seed the table with one row so there is existing data to replace.
    body = io.BytesIO(b"Washington,WA")
    client.load_table_from_file(body, table_id, job_config=job_config).result()
    previous_rows = client.get_table(table_id).num_rows
    assert previous_rows > 0

    job_config = bigquery.LoadJobConfig(
        write_disposition=bigquery.WriteDisposition.WRITE_TRUNCATE,
        source_format=bigquery.SourceFormat.AVRO,
    )

    uri = "gs://cloud-samples-data/bigquery/us-states/us-states.avro"
    load_job = client.load_table_from_uri(
        uri, table_id, job_config=job_config
    )  # Make an API request.

    load_job.result()  # Waits for the job to complete.

    destination_table = client.get_table(table_id)
    print("Loaded {} rows.".format(destination_table.num_rows))
    # [END bigquery_load_table_gcs_avro_truncate]
Oops, something went wrong.