Correct BigQuery partitioning/clustering metadata in ETL `metadata.yaml` files (#3500)
* Add missing BigQuery partitioning/clustering metadata.
* Correct existing BigQuery partitioning/clustering metadata.
* Allow partition `field` metadata field to be omitted.
* List partition `type` metadata field first.
This commit is contained in:
Родитель
6978139496
Коммит
495ddcf39f
|
@ -57,8 +57,8 @@ class PartitionType(enum.Enum):
|
||||||
class PartitionMetadata:
|
class PartitionMetadata:
|
||||||
"""Metadata for defining BigQuery table partitions."""
|
"""Metadata for defining BigQuery table partitions."""
|
||||||
|
|
||||||
field: str
|
|
||||||
type: PartitionType
|
type: PartitionType
|
||||||
|
field: Optional[str] = attr.ib(None)
|
||||||
require_partition_filter: bool = attr.ib(True)
|
require_partition_filter: bool = attr.ib(True)
|
||||||
expiration_days: Optional[float] = attr.ib(None)
|
expiration_days: Optional[float] = attr.ib(None)
|
||||||
|
|
||||||
|
|
|
@ -58,8 +58,8 @@ owners:
|
||||||
- wlachance@mozilla.com
|
- wlachance@mozilla.com
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering:
|
clustering:
|
||||||
|
@ -91,8 +91,8 @@ owners:
|
||||||
- wlachance@mozilla.com
|
- wlachance@mozilla.com
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering:
|
clustering:
|
||||||
|
|
|
@ -25,3 +25,8 @@ scheduling:
|
||||||
# explicit query file path is necessary because the destination table
|
# explicit query file path is necessary because the destination table
|
||||||
# includes a partition identifier that is not in the path
|
# includes a partition identifier that is not in the path
|
||||||
sql/moz-fx-cjms-nonprod-9a36/cjms_bigquery/flows_v1/query.sql
|
sql/moz-fx-cjms-nonprod-9a36/cjms_bigquery/flows_v1/query.sql
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -9,3 +9,8 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_subplat
|
dag_name: bqetl_subplat
|
||||||
query_project: moz-fx-data-shared-prod
|
query_project: moz-fx-data-shared-prod
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,8 @@ owners:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_experiments_daily
|
dag_name: bqetl_experiments_daily
|
||||||
referenced_tables: [['region-us', 'INFORMATION_SCHEMA', 'JOBS_BY_PROJECT']]
|
referenced_tables: [['region-us', 'INFORMATION_SCHEMA', 'JOBS_BY_PROJECT']]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -21,13 +21,12 @@ scheduling:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: last_modified_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: last_modified_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
- double_opt_in
|
|
||||||
- has_opted_out_of_email
|
- has_opted_out_of_email
|
||||||
|
- double_opt_in
|
||||||
- email_lang
|
- email_lang
|
||||||
- mailing_country
|
- mailing_country
|
||||||
- cohort
|
|
||||||
|
|
|
@ -34,6 +34,12 @@ scheduling:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: last_modified_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: last_modified_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- has_opted_out_of_email
|
||||||
|
- double_opt_in
|
||||||
|
- email_lang
|
||||||
|
- mailing_country
|
||||||
|
|
|
@ -24,13 +24,12 @@ scheduling:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: last_modified_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: last_modified_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
- double_opt_in
|
|
||||||
- has_opted_out_of_email
|
- has_opted_out_of_email
|
||||||
|
- double_opt_in
|
||||||
- email_lang
|
- email_lang
|
||||||
- mailing_country
|
- mailing_country
|
||||||
- cohort
|
|
||||||
|
|
|
@ -37,6 +37,11 @@ scheduling:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- event_type
|
||||||
|
- recipient_type
|
||||||
|
- body_type
|
||||||
|
|
|
@ -24,8 +24,8 @@ scheduling:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -10,3 +10,14 @@ scheduling:
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_goals_v1']
|
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_goals_v1']
|
||||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_sessions_v1']
|
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_sessions_v1']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- country
|
||||||
|
- browser
|
||||||
|
- blog
|
||||||
|
- subblog
|
||||||
|
|
|
@ -9,3 +9,8 @@ scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_empty_check_v1']
|
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_empty_check_v1']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -11,3 +11,14 @@ scheduling:
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_goals_v1"]
|
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_goals_v1"]
|
||||||
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_sessions_v1"]
|
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_sessions_v1"]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- cleaned_landing_page
|
||||||
|
- browser
|
||||||
|
- blog
|
||||||
|
- subblog
|
||||||
|
|
|
@ -10,3 +10,8 @@ scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_empty_check_v1"]
|
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_empty_check_v1"]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,8 @@ owners:
|
||||||
- ascholtz@mozilla.com
|
- ascholtz@mozilla.com
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
||||||
- ascholtz@mozilla.com
|
- ascholtz@mozilla.com
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- page_name
|
||||||
|
- event_category
|
||||||
|
- event_action
|
||||||
|
- event_label
|
||||||
|
|
|
@ -9,3 +9,8 @@ scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'www_site_empty_check_v1']
|
- ['moz-fx-data-marketing-prod', 'ga_derived', 'www_site_empty_check_v1']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
||||||
- ascholtz@mozilla.com
|
- ascholtz@mozilla.com
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- page_name
|
||||||
|
- country
|
||||||
|
- locale
|
||||||
|
- medium
|
||||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
||||||
- ascholtz@mozilla.com
|
- ascholtz@mozilla.com
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- country
|
||||||
|
- browser
|
||||||
|
- source
|
||||||
|
- medium
|
||||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
||||||
- ascholtz@mozilla.com
|
- ascholtz@mozilla.com
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_google_analytics_derived
|
dag_name: bqetl_google_analytics_derived
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- page_name
|
||||||
|
- country
|
||||||
|
- locale
|
||||||
|
- medium
|
||||||
|
|
|
@ -13,6 +13,6 @@ scheduling:
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
|
|
|
@ -16,6 +16,6 @@ scheduling:
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
|
|
|
@ -18,6 +18,6 @@ scheduling:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
|
|
|
@ -10,6 +10,15 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_activity_stream
|
dag_name: bqetl_activity_stream
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_timestamp
|
||||||
|
require_partition_filter: true
|
||||||
|
expiration_days: 180
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- experiment_id
|
||||||
workgroup_access:
|
workgroup_access:
|
||||||
- role: roles/bigquery.dataViewer
|
- role: roles/bigquery.dataViewer
|
||||||
members:
|
members:
|
||||||
|
|
|
@ -8,6 +8,16 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_activity_stream
|
dag_name: bqetl_activity_stream
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_timestamp
|
||||||
|
require_partition_filter: true
|
||||||
|
expiration_days: 180
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
- sample_id
|
||||||
workgroup_access:
|
workgroup_access:
|
||||||
- role: roles/bigquery.dataViewer
|
- role: roles/bigquery.dataViewer
|
||||||
members:
|
members:
|
||||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_amo_stats
|
dag_name: bqetl_amo_stats
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- addon_id
|
||||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_amo_stats
|
dag_name: bqetl_amo_stats
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- hashed_addon_id
|
||||||
|
|
|
@ -15,3 +15,11 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_amo_stats
|
dag_name: bqetl_amo_stats
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- addon_id
|
||||||
|
|
|
@ -15,3 +15,11 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_amo_stats
|
dag_name: bqetl_amo_stats
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- hashed_addon_id
|
||||||
|
|
|
@ -15,3 +15,11 @@ scheduling:
|
||||||
# query to get it, and that would be slow because main_v4 is referenced
|
# query to get it, and that would be slow because main_v4 is referenced
|
||||||
referenced_tables: [['moz-fx-data-shared-prod', 'telemetry_stable',
|
referenced_tables: [['moz-fx-data-shared-prod', 'telemetry_stable',
|
||||||
'main_v4']]
|
'main_v4']]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- sample_id
|
||||||
|
|
|
@ -12,3 +12,11 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_amo_stats
|
dag_name: bqetl_amo_stats
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- sample_id
|
||||||
|
|
|
@ -10,7 +10,7 @@ scheduling:
|
||||||
dag_name: bqetl_ctxsvc_derived
|
dag_name: bqetl_ctxsvc_derived
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
|
|
|
@ -8,5 +8,9 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_ctxsvc_derived
|
dag_name: bqetl_ctxsvc_derived
|
||||||
bigquery: null
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
references: {}
|
references: {}
|
||||||
|
|
|
@ -8,5 +8,9 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_ctxsvc_derived
|
dag_name: bqetl_ctxsvc_derived
|
||||||
bigquery: null
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
references: {}
|
references: {}
|
||||||
|
|
|
@ -9,3 +9,12 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_ctxsvc_derived
|
dag_name: bqetl_ctxsvc_derived
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- source
|
||||||
|
- event_type
|
||||||
|
|
|
@ -13,8 +13,8 @@ labels:
|
||||||
|
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: month
|
type: month
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
|
|
||||||
scheduling:
|
scheduling:
|
||||||
|
|
|
@ -26,9 +26,9 @@ scheduling:
|
||||||
execution_delta: 0h
|
execution_delta: 0h
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
require_partition_filter: true
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
- adjust_network
|
- adjust_network
|
||||||
|
|
|
@ -22,8 +22,8 @@ scheduling:
|
||||||
execution_delta: 1h
|
execution_delta: 1h
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -17,3 +17,12 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fenix_event_rollup
|
dag_name: bqetl_fenix_event_rollup
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- category
|
||||||
|
- event
|
||||||
|
|
|
@ -20,3 +20,11 @@ scheduling:
|
||||||
'event_types_v1'
|
'event_types_v1'
|
||||||
],
|
],
|
||||||
]
|
]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- sample_id
|
||||||
|
|
|
@ -43,8 +43,8 @@ scheduling:
|
||||||
- submission_date:DATE:{{ds}}
|
- submission_date:DATE:{{ds}}
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: first_seen_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: first_seen_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -7,8 +7,8 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering:
|
clustering:
|
||||||
|
|
|
@ -14,8 +14,8 @@ scheduling:
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering: null
|
clustering: null
|
||||||
|
|
|
@ -13,8 +13,8 @@ scheduling:
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering: null
|
clustering: null
|
||||||
|
|
|
@ -17,3 +17,12 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_event_rollup
|
dag_name: bqetl_event_rollup
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- category
|
||||||
|
- event
|
||||||
|
|
|
@ -20,3 +20,11 @@ scheduling:
|
||||||
'event_types_v1'
|
'event_types_v1'
|
||||||
],
|
],
|
||||||
]
|
]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- sample_id
|
||||||
|
|
|
@ -9,3 +9,8 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -13,4 +13,8 @@ scheduling:
|
||||||
dag_name: bqetl_event_rollup
|
dag_name: bqetl_event_rollup
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
task_name: funnel_events_source__v1
|
task_name: funnel_events_source__v1
|
||||||
bigquery: null
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -9,3 +9,11 @@ labels:
|
||||||
application: fxa
|
application: fxa
|
||||||
incremental: true
|
incremental: true
|
||||||
schedule: daily
|
schedule: daily
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date_pacific
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- user_id
|
||||||
|
|
|
@ -15,3 +15,8 @@ labels:
|
||||||
# dag_name: bqetl_fxa_events
|
# dag_name: bqetl_fxa_events
|
||||||
# arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
# arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
# referenced_tables: []
|
# referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -11,3 +11,8 @@ scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: true
|
||||||
|
|
|
@ -11,3 +11,8 @@ scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -16,3 +16,8 @@ scheduling:
|
||||||
# depends only on fxa logs produced via Stackdriver integration, so no other
|
# depends only on fxa logs produced via Stackdriver integration, so no other
|
||||||
# scheduled tasks are involved and the referenced_tables list is empty.
|
# scheduled tasks are involved and the referenced_tables list is empty.
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -14,3 +14,11 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- event
|
||||||
|
|
|
@ -14,3 +14,11 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- event
|
||||||
|
|
|
@ -17,3 +17,11 @@ scheduling:
|
||||||
# depends only on fxa logs produced via Stackdriver integration, so no other
|
# depends only on fxa logs produced via Stackdriver integration, so no other
|
||||||
# scheduled tasks are involved and the referenced_tables list is empty.
|
# scheduled tasks are involved and the referenced_tables list is empty.
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- command
|
||||||
|
|
|
@ -10,3 +10,8 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -15,8 +15,8 @@ scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -21,8 +21,8 @@ scheduling:
|
||||||
- submission_date:DATE:{{ds}}
|
- submission_date:DATE:{{ds}}
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: first_seen_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: first_seen_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -21,8 +21,8 @@ scheduling:
|
||||||
start_date: '2019-04-23'
|
start_date: '2019-04-23'
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering:
|
clustering:
|
||||||
|
|
|
@ -10,3 +10,12 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
date_partition_parameter: submission_date
|
date_partition_parameter: submission_date
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- service
|
||||||
|
- user_id
|
||||||
|
|
|
@ -24,8 +24,8 @@ scheduling:
|
||||||
date_partition_parameter: submission_date
|
date_partition_parameter: submission_date
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: timestamp
|
|
||||||
type: day
|
type: day
|
||||||
|
field: timestamp
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -25,8 +25,8 @@ scheduling:
|
||||||
]
|
]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: first_seen_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: first_seen_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -22,8 +22,8 @@ scheduling:
|
||||||
]
|
]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -15,3 +15,12 @@ labels:
|
||||||
# # making it incremental is possible but nuanced since it windows over
|
# # making it incremental is possible but nuanced since it windows over
|
||||||
# # events that may cross the midnight boundary.
|
# # events that may cross the midnight boundary.
|
||||||
# date_partition_parameter: null
|
# date_partition_parameter: null
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: first_service_timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- service
|
||||||
|
- user_id
|
||||||
|
|
|
@ -14,3 +14,12 @@ labels:
|
||||||
# dag_name: bqetl_fxa_events
|
# dag_name: bqetl_fxa_events
|
||||||
# depends_on_past: true
|
# depends_on_past: true
|
||||||
# start_date: '2019-10-08'
|
# start_date: '2019-10-08'
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- service
|
||||||
|
- user_id
|
||||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: true
|
||||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
referenced_tables: []
|
referenced_tables: []
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: true
|
||||||
|
|
|
@ -11,3 +11,8 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_fxa_events
|
dag_name: bqetl_fxa_events
|
||||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: true
|
||||||
|
|
|
@ -7,8 +7,8 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
expiration_days: null
|
expiration_days: null
|
||||||
clustering:
|
clustering:
|
||||||
|
|
|
@ -76,8 +76,8 @@ scheduling:
|
||||||
- health_v4
|
- health_v4
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: datetime
|
|
||||||
type: day
|
type: day
|
||||||
|
field: datetime
|
||||||
require_partition_filter: null
|
require_partition_filter: null
|
||||||
clustering:
|
clustering:
|
||||||
fields:
|
fields:
|
||||||
|
|
|
@ -8,3 +8,8 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,11 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
|
|
@ -17,3 +17,12 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_event_rollup
|
dag_name: bqetl_event_rollup
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- category
|
||||||
|
- event
|
||||||
|
|
|
@ -20,3 +20,11 @@ scheduling:
|
||||||
'event_types_v1'
|
'event_types_v1'
|
||||||
],
|
],
|
||||||
]
|
]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- sample_id
|
||||||
|
|
|
@ -10,3 +10,8 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
task_name: messaging_system_onboarding_exact_mau28_by_dimensions
|
task_name: messaging_system_onboarding_exact_mau28_by_dimensions
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,11 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
|
|
@ -10,3 +10,8 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
task_name: messaging_system_snippets_exact_mau28_by_dimensions
|
task_name: messaging_system_snippets_exact_mau28_by_dimensions
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -7,3 +7,11 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_messaging_system
|
dag_name: bqetl_messaging_system
|
||||||
depends_on_past: true
|
depends_on_past: true
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- release_channel
|
||||||
|
|
|
@ -10,3 +10,8 @@ scheduling:
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-shared-prod', 'monitoring_derived', 'stable_table_sizes_v1']
|
- ['moz-fx-data-shared-prod', 'monitoring_derived', 'stable_table_sizes_v1']
|
||||||
- ['moz-fx-data-shared-prod', '*_stable', "*"]
|
- ['moz-fx-data-shared-prod', '*_stable', "*"]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -9,3 +9,8 @@ owners:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_monitoring
|
dag_name: bqetl_monitoring
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -10,3 +10,8 @@ owners:
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_monitoring
|
dag_name: bqetl_monitoring
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -10,6 +10,6 @@ scheduling:
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: change_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: change_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
|
|
|
@ -10,5 +10,6 @@ scheduling:
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: true
|
||||||
|
|
|
@ -10,6 +10,6 @@ scheduling:
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: creation_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: creation_date
|
||||||
require_partition_filter: true
|
require_partition_filter: true
|
||||||
|
|
|
@ -10,3 +10,8 @@ scheduling:
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
|
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -18,3 +18,8 @@ scheduling:
|
||||||
- ['moz-fx-data-shared-prod',
|
- ['moz-fx-data-shared-prod',
|
||||||
'monitoring',
|
'monitoring',
|
||||||
'payload_bytes_decoded_telemetry']
|
'payload_bytes_decoded_telemetry']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -9,3 +9,14 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_monitoring
|
dag_name: bqetl_monitoring
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
clustering:
|
||||||
|
fields:
|
||||||
|
- document_namespace
|
||||||
|
- document_type
|
||||||
|
- path
|
||||||
|
- job_name
|
||||||
|
|
|
@ -15,3 +15,8 @@ scheduling:
|
||||||
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
||||||
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
|
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
|
||||||
- ['moz-fx-data-shared-prod', '*_derived', '*']
|
- ['moz-fx-data-shared-prod', '*_derived', '*']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -15,6 +15,6 @@ scheduling:
|
||||||
parameters: ["submission_date:DATE:{{ds}}"]
|
parameters: ["submission_date:DATE:{{ds}}"]
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
|
|
|
@ -10,8 +10,8 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_monitoring
|
dag_name: bqetl_monitoring
|
||||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
||||||
arguments: ["--date", "{{ ds }}"]
|
arguments: ["--date", "{{ ds }}"]
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -10,8 +10,8 @@ labels:
|
||||||
incremental: true
|
incremental: true
|
||||||
bigquery:
|
bigquery:
|
||||||
time_partitioning:
|
time_partitioning:
|
||||||
field: submission_date
|
|
||||||
type: day
|
type: day
|
||||||
|
field: submission_date
|
||||||
require_partition_filter: false
|
require_partition_filter: false
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_monitoring
|
dag_name: bqetl_monitoring
|
||||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
||||||
dag_name: bqetl_monitoring
|
dag_name: bqetl_monitoring
|
||||||
referenced_tables:
|
referenced_tables:
|
||||||
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: submission_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -14,3 +14,8 @@ scheduling:
|
||||||
# delay aggregates by 7 days, to ensure data is complete
|
# delay aggregates by 7 days, to ensure data is complete
|
||||||
date_partition_offset: -7
|
date_partition_offset: -7
|
||||||
date_partition_parameter: date
|
date_partition_parameter: date
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: active_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -11,3 +11,8 @@ scheduling:
|
||||||
# delay aggregates by 7 days, to ensure data is complete
|
# delay aggregates by 7 days, to ensure data is complete
|
||||||
date_partition_offset: -7
|
date_partition_offset: -7
|
||||||
date_partition_parameter: date
|
date_partition_parameter: date
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: active_date
|
||||||
|
require_partition_filter: false
|
||||||
|
|
|
@ -8,3 +8,8 @@ labels:
|
||||||
schedule: daily
|
schedule: daily
|
||||||
scheduling:
|
scheduling:
|
||||||
dag_name: bqetl_subplat
|
dag_name: bqetl_subplat
|
||||||
|
bigquery:
|
||||||
|
time_partitioning:
|
||||||
|
type: day
|
||||||
|
field: timestamp
|
||||||
|
require_partition_filter: false
|
||||||
|
|
Некоторые файлы не были показаны из-за слишком большого количества измененных файлов Показать больше
Загрузка…
Ссылка в новой задаче