Skip to content

Commit fa569fd

Browse files
10148 BigQuery Destination/Denormalized Destination spec updates
1 parent 5cc2027 commit fa569fd

File tree

3 files changed

+20
-18
lines changed
  • airbyte-integrations/connectors
    • destination-bigquery/src/main/resources
    • destination-bigquery-denormalized/src/main/resources
  • docs/integrations/destinations

3 files changed

+20
-18
lines changed

airbyte-integrations/connectors/destination-bigquery-denormalized/src/main/resources/spec.json

Lines changed: 16 additions & 16 deletions
Original file line numberDiff line numberDiff line change
@@ -12,8 +12,8 @@
1212
"additionalProperties": true,
1313
"properties": {
1414
"big_query_client_buffer_size_mb": {
15-
"title": "Google BigQuery client chunk size",
16-
"description": "Google BigQuery client's chunk (buffer) size (MIN = 1, MAX = 15) for each table. The size that will be written by a single RPC. Written data will be buffered and only flushed upon reaching this size or closing the channel. It defaults to 15MiB. Smaller chunk size means less memory consumption, and is recommended for big data sets. For more details refer to the documentation <a href=\"https://googleapis.dev/python/bigquery/latest/generated/google.cloud.bigquery.client.Client.html\">here</a>",
15+
"title": "Google BigQuery Client Chunk Size (Optional)",
16+
"description": "Google BigQuery client's chunk (buffer) size (MIN = 1, MAX = 15) for each table. The size that will be written by a single RPC. Written data will be buffered and only flushed upon reaching this size or closing the channel. The default 15MB value is used if not set explicitly. Read more <a href=\"https://googleapis.dev/python/bigquery/latest/generated/google.cloud.bigquery.client.Client.html\">here</a>.",
1717
"type": "integer",
1818
"minimum": 1,
1919
"maximum": 15,
@@ -22,18 +22,18 @@
2222
},
2323
"project_id": {
2424
"type": "string",
25-
"description": "The GCP project ID for the project containing the target BigQuery dataset.",
25+
"description": "The GCP project ID for the project containing the target BigQuery dataset. Read more <a href=\"https://cloud.google.com/resource-manager/docs/creating-managing-projects#identifying_projects\">here</a>.",
2626
"title": "Project ID"
2727
},
2828
"dataset_id": {
2929
"type": "string",
30-
"description": "Default BigQuery Dataset ID tables are replicated to if the source does not specify a namespace.",
30+
"description": "The default BigQuery Dataset ID that tables are replicated to if the source does not specify a namespace. Read more <a href=\"https://cloud.google.com/bigquery/docs/datasets#create-dataset\">here</a>.",
3131
"title": "Default Dataset ID"
3232
},
3333
"dataset_location": {
3434
"type": "string",
35-
"description": "The location of the dataset. Warning: Changes made after creation will not be applied.",
36-
"title": "Dataset Location",
35+
"description": "The location of the dataset. Warning: Changes made after creation will not be applied. The default \"US\" value is used if not set explicitly. Read more <a href=\"https://cloud.google.com/bigquery/docs/locations\">here</a>.",
36+
"title": "Dataset Location (Optional)",
3737
"default": "US",
3838
"enum": [
3939
"US",
@@ -71,19 +71,18 @@
7171
},
7272
"credentials_json": {
7373
"type": "string",
74-
"description": "The contents of the JSON service account key. Check out the <a href=\"https://docs.airbyte.io/integrations/destinations/bigquery\">docs</a> if you need help generating this key. Default credentials will be used if this field is left empty.",
75-
"title": "Credentials JSON",
74+
"description": "The contents of the JSON service account key. Check out the <a href=\"https://docs.airbyte.com/integrations/destinations/bigquery#service-account-key\">docs</a> if you need help generating this key. Default credentials will be used if this field is left empty.",
75+
"title": "Service Account Key JSON (Optional)",
7676
"airbyte_secret": true
7777
},
7878
"loading_method": {
7979
"type": "object",
80-
"title": "Loading Method",
81-
"description": "Select the way that data will be uploaded to BigQuery.",
80+
"title": "Loading Method *",
81+
"description": "Loading method used to select the way data will be uploaded to BigQuery. <br><b>Standard Inserts</b> - Direct uploading using SQL INSERT statements. This method is extremely inefficient and provided only for quick testing. In almost all cases, you should use staging. <br><b>GCS Staging</b> - Writes large batches of records to a file, uploads the file to GCS, then uses <b>COPY INTO table</b> to upload the file. Recommended for most workloads for better speed and scalability. Read more about GCS Staging <a href=\"https://docs.airbyte.com/integrations/destinations/bigquery#gcs-staging\">here</a>.",
8282
"oneOf": [
8383
{
8484
"title": "Standard Inserts",
8585
"additionalProperties": false,
86-
"description": "Direct uploading using streams.",
8786
"required": ["method"],
8887
"properties": {
8988
"method": {
@@ -95,7 +94,6 @@
9594
{
9695
"title": "GCS Staging",
9796
"additionalProperties": false,
98-
"description": "Writes large batches of records to a file, uploads the file to GCS, then uses <pre>COPY INTO table</pre> to upload the file. Recommended for large production workloads for better speed and scalability.",
9997
"required": [
10098
"method",
10199
"gcs_bucket_name",
@@ -110,16 +108,17 @@
110108
"gcs_bucket_name": {
111109
"title": "GCS Bucket Name",
112110
"type": "string",
113-
"description": "The name of the GCS bucket.",
111+
"description": "The name of the GCS bucket. Read more <a href=\"https://cloud.google.com/storage/docs/naming-buckets\">here</a>.",
114112
"examples": ["airbyte_sync"]
115113
},
116114
"gcs_bucket_path": {
115+
"title": "GCS Bucket Path",
117116
"description": "Directory under the GCS bucket where data will be written.",
118117
"type": "string",
119118
"examples": ["data_sync/test"]
120119
},
121120
"part_size_mb": {
122-
"title": "Block Size (MB) for GCS multipart upload",
121+
"title": "Block Size (MB) for GCS Multipart Upload (Optional)",
123122
"description": "This is the size of a \"Part\" being buffered in memory. It limits the memory usage when writing. Larger values allow uploading bigger files and improve the speed, but consume more memory. Allowed values: min=5MB, max=525MB. Default: 5MB.",
124123
"type": "integer",
125124
"default": 5,
@@ -129,8 +128,8 @@
129128
},
130129
"keep_files_in_gcs-bucket": {
131130
"type": "string",
132-
"description": "This upload method is supposed to temporary store records in GCS bucket. What do you want to do with data in GCS bucket when migration has finished?",
133-
"title": "GCS tmp files afterward processing",
131+
"description": "This upload method is supposed to temporarily store records in a GCS bucket. What do you want to do with the data in the GCS bucket when the migration has finished? The default \"Delete all tmp files from GCS\" value is used if not set explicitly.",
132+
"title": "GCS Tmp Files Afterward Processing (Optional)",
134133
"default": "Delete all tmp files from GCS",
135134
"enum": [
136135
"Delete all tmp files from GCS",
@@ -139,6 +138,7 @@
139138
},
140139
"credential": {
141140
"title": "Credential",
141+
"description": "An HMAC key is a type of credential and can be associated with a service account or a user account in Cloud Storage. Read more <a href=\"https://cloud.google.com/storage/docs/authentication/hmackeys\">here</a>.",
142142
"type": "object",
143143
"oneOf": [
144144
{

airbyte-integrations/connectors/destination-bigquery/src/main/resources/spec.json

Lines changed: 2 additions & 2 deletions
Original file line numberDiff line numberDiff line change
@@ -22,7 +22,7 @@
2222
},
2323
"project_id": {
2424
"type": "string",
25-
"description": "The GCP project ID for the project containing the target BigQuery dataset. Read more <a href=\"https://cloud.google.com/iam/docs/creating-managing-service-accounts#creating\">here</a>.",
25+
"description": "The GCP project ID for the project containing the target BigQuery dataset. Read more <a href=\"https://cloud.google.com/resource-manager/docs/creating-managing-projects#identifying_projects\">here</a>.",
2626
"title": "Project ID"
2727
},
2828
"dataset_id": {
@@ -72,7 +72,7 @@
7272
"credentials_json": {
7373
"type": "string",
7474
"description": "The contents of the JSON service account key. Check out the <a href=\"https://docs.airbyte.com/integrations/destinations/bigquery#service-account-key\">docs</a> if you need help generating this key. Default credentials will be used if this field is left empty.",
75-
"title": "Credentials JSON (Optional)",
75+
"title": "Service Account Key JSON (Optional)",
7676
"airbyte_secret": true
7777
},
7878
"transformation_priority": {

docs/integrations/destinations/bigquery.md

Lines changed: 2 additions & 0 deletions
Original file line numberDiff line numberDiff line change
@@ -207,6 +207,7 @@ This uploads data directly from your source to BigQuery. While this is faster to
207207
208208
| Version | Date | Pull Request | Subject |
209209
|:--------| :--- | :--- | :--- |
210+
| 1.0.2 | 2022-03-30 | [](https://github.com/airbytehq/airbyte/pull/) | Updated spec |
210211
| 1.0.1 | 2022-03-24 | [11350](https://github.com/airbytehq/airbyte/pull/11350) | Improve check performance |
211212
| 1.0.0 | 2022-03-18 | [11238](https://github.com/airbytehq/airbyte/pull/11238) | Updated spec and documentation |
212213
| 0.6.12 | 2022-03-18 | [10793](https://github.com/airbytehq/airbyte/pull/10793) | Fix namespace with invalid characters |
@@ -235,6 +236,7 @@ This uploads data directly from your source to BigQuery. While this is faster to
235236
236237
| Version | Date | Pull Request | Subject |
237238
|:--------|:-----------|:-----------------------------------------------------------| :--- |
239+
| 0.2.12 | 2022-03-30 | [](https://github.com/airbytehq/airbyte/pull/) | Updated spec |
238240
| 0.2.11 | 2022-03-18 | [10793](https://github.com/airbytehq/airbyte/pull/10793) | Fix namespace with invalid characters |
239241
| 0.2.10 | 2022-03-03 | [10755](https://github.com/airbytehq/airbyte/pull/10755) | Make sure to kill children threads and stop JVM |
240242
| 0.2.8 | 2022-02-14 | [10256](https://github.com/airbytehq/airbyte/pull/10256) | Add `-XX:+ExitOnOutOfMemoryError` JVM option |

0 commit comments

Comments
 (0)