mozilla / bigquery-etl

Bigquery ETL
https://mozilla.github.io/bigquery-etl
Mozilla Public License 2.0
253 stars · 100 forks · source link

Remove the date partition parameter and add the `--append_table` and `--noreplace` flags #5719

Status: Closed (chelseybeck closed this 4 months ago)

chelseybeck commented 4 months ago

Checklist for reviewer:

For modifications to schemas in restricted namespaces (see CODEOWNERS):

Issue is synchronized with this Jira Task

dataops-ci-bot commented 4 months ago

Integration report for "updating to remove partition parameter and add tags"

sql.diff

<details>
<summary>Click to expand!</summary>

```diff
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/dags/bqetl_braze.py /tmp/workspace/generated-sql/dags/bqetl_braze.py
--- /tmp/workspace/main-generated-sql/dags/bqetl_braze.py 2024-06-03 19:54:29.000000000 +0000
+++ /tmp/workspace/generated-sql/dags/bqetl_braze.py 2024-06-03 19:55:56.000000000 +0000
@@ -146,8 +146,10 @@
         project_id="moz-fx-data-shared-prod",
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
-        date_partition_parameter="updated_at",
+        date_partition_parameter=None,
         depends_on_past=False,
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
     )
 
     braze_external__changed_newsletters_sync__v1 = bigquery_etl_query(
@@ -157,8 +159,10 @@
         project_id="moz-fx-data-shared-prod",
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
-        date_partition_parameter="updated_at",
+        date_partition_parameter=None,
         depends_on_past=False,
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
     )
 
     braze_external__changed_products_sync__v1 = bigquery_etl_query(
@@ -168,8 +172,10 @@
         project_id="moz-fx-data-shared-prod",
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
-        date_partition_parameter="updated_at",
+        date_partition_parameter=None,
         depends_on_past=False,
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
     )
 
     braze_external__changed_users__v1 = bigquery_etl_query(
@@ -191,8 +197,10 @@
         project_id="moz-fx-data-shared-prod",
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
-        date_partition_parameter="updated_at",
+        date_partition_parameter=None,
         depends_on_past=False,
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
     )
 
     braze_external__changed_waitlists_sync__v1 = bigquery_etl_query(
@@ -202,8 +210,10 @@
         project_id="moz-fx-data-shared-prod",
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
-        date_partition_parameter="updated_at",
+        date_partition_parameter=None,
         depends_on_past=False,
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
     )
 
     braze_external__delete_users_sync__v1 = bigquery_etl_query(
@@ -213,8 +223,10 @@
         project_id="moz-fx-data-shared-prod",
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
-        date_partition_parameter="updated_at",
+        date_partition_parameter=None,
         depends_on_past=False,
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
     )
 
     braze_external__users_previous_day_snapshot__v1 = bigquery_etl_query(
@@ -341,7 +353,8 @@
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
         depends_on_past=False,
-        parameters=["updated_at:DATE:{{ds}}"],
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
         retries=0,
     )
 
@@ -354,7 +367,8 @@
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
         depends_on_past=False,
-        parameters=["updated_at:DATE:{{ds}}"],
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
         retries=0,
     )
 
@@ -367,7 +381,8 @@
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
         depends_on_past=False,
-        parameters=["updated_at:DATE:{{ds}}"],
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
         retries=0,
     )
 
@@ -393,7 +408,8 @@
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
         depends_on_past=False,
-        parameters=["updated_at:DATE:{{ds}}"],
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
         retries=0,
     )
 
@@ -406,7 +422,8 @@
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
         depends_on_past=False,
-        parameters=["updated_at:DATE:{{ds}}"],
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
         retries=0,
     )
 
@@ -419,7 +436,8 @@
         owner="cbeck@mozilla.com",
         email=["cbeck@mozilla.com", "leli@mozilla.com"],
         depends_on_past=False,
-        parameters=["updated_at:DATE:{{ds}}"],
+        task_concurrency=1,
+        arguments=["--append_table", "--noreplace"],
         retries=0,
     )
 
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_firefox_subscriptions_sync_v1/metadata.yaml /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_firefox_subscriptions_sync_v1/metadata.yaml
--- /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_firefox_subscriptions_sync_v1/metadata.yaml 2024-06-03 19:52:33.000000000 +0000
+++ /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_firefox_subscriptions_sync_v1/metadata.yaml 2024-06-03 19:52:46.000000000 +0000
@@ -15,7 +15,10 @@
   owner1: cbeck
 scheduling:
   dag_name: bqetl_braze
-  date_partition_parameter: updated_at
+  date_partition_parameter: null
+  arguments:
+  - --append_table
+  - --noreplace
 bigquery:
   time_partitioning: null
   range_partitioning: null
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_newsletters_sync_v1/metadata.yaml /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_newsletters_sync_v1/metadata.yaml
--- /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_newsletters_sync_v1/metadata.yaml 2024-06-03 19:52:33.000000000 +0000
+++ /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_newsletters_sync_v1/metadata.yaml 2024-06-03 19:52:46.000000000 +0000
@@ -14,7 +14,10 @@
   owner1: cbeck
 scheduling:
   dag_name: bqetl_braze
-  date_partition_parameter: updated_at
+  date_partition_parameter: null
+  arguments:
+  - --append_table
+  - --noreplace
 bigquery:
   time_partitioning: null
   range_partitioning: null
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_products_sync_v1/metadata.yaml /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_products_sync_v1/metadata.yaml
--- /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_products_sync_v1/metadata.yaml 2024-06-03 19:52:33.000000000 +0000
+++ /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_products_sync_v1/metadata.yaml 2024-06-03 19:52:46.000000000 +0000
@@ -14,7 +14,10 @@
   owner1: cbeck
 scheduling:
   dag_name: bqetl_braze
-  date_partition_parameter: updated_at
+  date_partition_parameter: null
+  arguments:
+  - --append_table
+  - --noreplace
 bigquery:
   time_partitioning: null
   range_partitioning: null
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_users_sync_v1/metadata.yaml /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_users_sync_v1/metadata.yaml
--- /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_users_sync_v1/metadata.yaml 2024-06-03 19:52:33.000000000 +0000
+++ /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_users_sync_v1/metadata.yaml 2024-06-03 19:52:46.000000000 +0000
@@ -14,7 +14,10 @@
   owner1: cbeck
 scheduling:
   dag_name: bqetl_braze
-  date_partition_parameter: updated_at
+  date_partition_parameter: null
+  arguments:
+  - --append_table
+  - --noreplace
 bigquery:
   time_partitioning: null
   range_partitioning: null
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_waitlists_sync_v1/metadata.yaml /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_waitlists_sync_v1/metadata.yaml
--- /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_waitlists_sync_v1/metadata.yaml 2024-06-03 19:52:33.000000000 +0000
+++ /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/changed_waitlists_sync_v1/metadata.yaml 2024-06-03 19:52:46.000000000 +0000
@@ -14,7 +14,10 @@
   owner1: cbeck
 scheduling:
   dag_name: bqetl_braze
-  date_partition_parameter: updated_at
+  date_partition_parameter: null
+  arguments:
+  - --append_table
+  - --noreplace
 bigquery:
   time_partitioning: null
   range_partitioning: null
diff -bur --no-dereference --new-file /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/delete_users_sync_v1/metadata.yaml /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/delete_users_sync_v1/metadata.yaml
--- /tmp/workspace/main-generated-sql/sql/moz-fx-data-shared-prod/braze_external/delete_users_sync_v1/metadata.yaml 2024-06-03 19:52:33.000000000 +0000
+++ /tmp/workspace/generated-sql/sql/moz-fx-data-shared-prod/braze_external/delete_users_sync_v1/metadata.yaml 2024-06-03 19:52:46.000000000 +0000
@@ -23,7 +23,10 @@
   owner1: cbeck
 scheduling:
   dag_name: bqetl_braze
-  date_partition_parameter: updated_at
+  date_partition_parameter: null
+  arguments:
+  - --append_table
+  - --noreplace
 bigquery:
   time_partitioning: null
   range_partitioning: null
```

</details>

Link to full diff