Correct BigQuery partitioning/clustering metadata in ETL `metadata.yaml` files (#3500)
* Add missing BigQuery partitioning/clustering metadata.
* Correct existing BigQuery partitioning/clustering metadata.
* Allow partition `field` metadata field to be omitted.
* List partition `type` metadata field first.
This commit is contained in:
Родитель
6978139496
Коммит
495ddcf39f
|
@ -57,8 +57,8 @@ class PartitionType(enum.Enum):
|
|||
class PartitionMetadata:
|
||||
"""Metadata for defining BigQuery table partitions."""
|
||||
|
||||
field: str
|
||||
type: PartitionType
|
||||
field: Optional[str] = attr.ib(None)
|
||||
require_partition_filter: bool = attr.ib(True)
|
||||
expiration_days: Optional[float] = attr.ib(None)
|
||||
|
||||
|
|
|
@ -58,8 +58,8 @@ owners:
|
|||
- wlachance@mozilla.com
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: date
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: true
|
||||
expiration_days: null
|
||||
clustering:
|
||||
|
@ -91,8 +91,8 @@ owners:
|
|||
- wlachance@mozilla.com
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: date
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: true
|
||||
expiration_days: null
|
||||
clustering:
|
||||
|
|
|
@ -25,3 +25,8 @@ scheduling:
|
|||
# explicit query file path is necessary because the destination table
|
||||
# includes a partition identifier that is not in the path
|
||||
sql/moz-fx-cjms-nonprod-9a36/cjms_bigquery/flows_v1/query.sql
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -9,3 +9,8 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_subplat
|
||||
query_project: moz-fx-data-shared-prod
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,8 @@ owners:
|
|||
scheduling:
|
||||
dag_name: bqetl_experiments_daily
|
||||
referenced_tables: [['region-us', 'INFORMATION_SCHEMA', 'JOBS_BY_PROJECT']]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_timestamp
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -21,13 +21,12 @@ scheduling:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: last_modified_date
|
||||
type: day
|
||||
field: last_modified_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- double_opt_in
|
||||
- has_opted_out_of_email
|
||||
- double_opt_in
|
||||
- email_lang
|
||||
- mailing_country
|
||||
- cohort
|
||||
|
|
|
@ -34,6 +34,12 @@ scheduling:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: last_modified_date
|
||||
type: day
|
||||
field: last_modified_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- has_opted_out_of_email
|
||||
- double_opt_in
|
||||
- email_lang
|
||||
- mailing_country
|
||||
|
|
|
@ -24,13 +24,12 @@ scheduling:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: last_modified_date
|
||||
type: day
|
||||
field: last_modified_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- double_opt_in
|
||||
- has_opted_out_of_email
|
||||
- double_opt_in
|
||||
- email_lang
|
||||
- mailing_country
|
||||
- cohort
|
||||
|
|
|
@ -37,6 +37,11 @@ scheduling:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- event_type
|
||||
- recipient_type
|
||||
- body_type
|
||||
|
|
|
@ -24,8 +24,8 @@ scheduling:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -10,3 +10,14 @@ scheduling:
|
|||
referenced_tables:
|
||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_goals_v1']
|
||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_sessions_v1']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- country
|
||||
- browser
|
||||
- blog
|
||||
- subblog
|
||||
|
|
|
@ -9,3 +9,8 @@ scheduling:
|
|||
dag_name: bqetl_google_analytics_derived
|
||||
referenced_tables:
|
||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_empty_check_v1']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -11,3 +11,14 @@ scheduling:
|
|||
referenced_tables:
|
||||
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_goals_v1"]
|
||||
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_sessions_v1"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- cleaned_landing_page
|
||||
- browser
|
||||
- blog
|
||||
- subblog
|
||||
|
|
|
@ -10,3 +10,8 @@ scheduling:
|
|||
dag_name: bqetl_google_analytics_derived
|
||||
referenced_tables:
|
||||
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_empty_check_v1"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,8 @@ owners:
|
|||
- ascholtz@mozilla.com
|
||||
scheduling:
|
||||
dag_name: bqetl_google_analytics_derived
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
|||
- ascholtz@mozilla.com
|
||||
scheduling:
|
||||
dag_name: bqetl_google_analytics_derived
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- page_name
|
||||
- event_category
|
||||
- event_action
|
||||
- event_label
|
||||
|
|
|
@ -9,3 +9,8 @@ scheduling:
|
|||
dag_name: bqetl_google_analytics_derived
|
||||
referenced_tables:
|
||||
- ['moz-fx-data-marketing-prod', 'ga_derived', 'www_site_empty_check_v1']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
|||
- ascholtz@mozilla.com
|
||||
scheduling:
|
||||
dag_name: bqetl_google_analytics_derived
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- page_name
|
||||
- country
|
||||
- locale
|
||||
- medium
|
||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
|||
- ascholtz@mozilla.com
|
||||
scheduling:
|
||||
dag_name: bqetl_google_analytics_derived
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- country
|
||||
- browser
|
||||
- source
|
||||
- medium
|
||||
|
|
|
@ -7,3 +7,14 @@ owners:
|
|||
- ascholtz@mozilla.com
|
||||
scheduling:
|
||||
dag_name: bqetl_google_analytics_derived
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- page_name
|
||||
- country
|
||||
- locale
|
||||
- medium
|
||||
|
|
|
@ -13,6 +13,6 @@ scheduling:
|
|||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -16,6 +16,6 @@ scheduling:
|
|||
arguments: ["--date", "{{ ds }}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -18,6 +18,6 @@ scheduling:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -10,6 +10,15 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_activity_stream
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_timestamp
|
||||
require_partition_filter: true
|
||||
expiration_days: 180
|
||||
clustering:
|
||||
fields:
|
||||
- experiment_id
|
||||
workgroup_access:
|
||||
- role: roles/bigquery.dataViewer
|
||||
members:
|
||||
|
|
|
@ -8,6 +8,16 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_activity_stream
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_timestamp
|
||||
require_partition_filter: true
|
||||
expiration_days: 180
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
- sample_id
|
||||
workgroup_access:
|
||||
- role: roles/bigquery.dataViewer
|
||||
members:
|
||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_amo_stats
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- addon_id
|
||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_amo_stats
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- hashed_addon_id
|
||||
|
|
|
@ -15,3 +15,11 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_amo_stats
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- addon_id
|
||||
|
|
|
@ -15,3 +15,11 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_amo_stats
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- hashed_addon_id
|
||||
|
|
|
@ -15,3 +15,11 @@ scheduling:
|
|||
# query to get it, and that would be slow because main_v4 is referenced
|
||||
referenced_tables: [['moz-fx-data-shared-prod', 'telemetry_stable',
|
||||
'main_v4']]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- sample_id
|
||||
|
|
|
@ -12,3 +12,11 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_amo_stats
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- sample_id
|
||||
|
|
|
@ -10,7 +10,7 @@ scheduling:
|
|||
dag_name: bqetl_ctxsvc_derived
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
expiration_days: null
|
||||
|
|
|
@ -8,5 +8,9 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_ctxsvc_derived
|
||||
bigquery: null
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
references: {}
|
||||
|
|
|
@ -8,5 +8,9 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_ctxsvc_derived
|
||||
bigquery: null
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
references: {}
|
||||
|
|
|
@ -9,3 +9,12 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_ctxsvc_derived
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- source
|
||||
- event_type
|
||||
|
|
|
@ -13,8 +13,8 @@ labels:
|
|||
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: month
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
|
||||
scheduling:
|
||||
|
|
|
@ -26,9 +26,9 @@ scheduling:
|
|||
execution_delta: 0h
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
require_partition_filter: true
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- adjust_network
|
||||
|
|
|
@ -22,8 +22,8 @@ scheduling:
|
|||
execution_delta: 1h
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -17,3 +17,12 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_fenix_event_rollup
|
||||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- category
|
||||
- event
|
||||
|
|
|
@ -20,3 +20,11 @@ scheduling:
|
|||
'event_types_v1'
|
||||
],
|
||||
]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- sample_id
|
||||
|
|
|
@ -43,8 +43,8 @@ scheduling:
|
|||
- submission_date:DATE:{{ds}}
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: first_seen_date
|
||||
type: day
|
||||
field: first_seen_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -7,8 +7,8 @@ labels:
|
|||
incremental: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
expiration_days: null
|
||||
clustering:
|
||||
|
|
|
@ -14,8 +14,8 @@ scheduling:
|
|||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: date
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
expiration_days: null
|
||||
clustering: null
|
||||
|
|
|
@ -13,8 +13,8 @@ scheduling:
|
|||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: date
|
||||
type: day
|
||||
field: date
|
||||
require_partition_filter: false
|
||||
expiration_days: null
|
||||
clustering: null
|
||||
|
|
|
@ -17,3 +17,12 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_event_rollup
|
||||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- category
|
||||
- event
|
||||
|
|
|
@ -20,3 +20,11 @@ scheduling:
|
|||
'event_types_v1'
|
||||
],
|
||||
]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- sample_id
|
||||
|
|
|
@ -9,3 +9,8 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_fxa_events
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -13,4 +13,8 @@ scheduling:
|
|||
dag_name: bqetl_event_rollup
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
task_name: funnel_events_source__v1
|
||||
bigquery: null
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -9,3 +9,11 @@ labels:
|
|||
application: fxa
|
||||
incremental: true
|
||||
schedule: daily
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date_pacific
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- user_id
|
||||
|
|
|
@ -15,3 +15,8 @@ labels:
|
|||
# dag_name: bqetl_fxa_events
|
||||
# arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
# referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -11,3 +11,8 @@ scheduling:
|
|||
dag_name: bqetl_fxa_events
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -11,3 +11,8 @@ scheduling:
|
|||
dag_name: bqetl_fxa_events
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -16,3 +16,8 @@ scheduling:
|
|||
# depends only on fxa logs produced via Stackdriver integration, so no other
|
||||
# scheduled tasks are involved and the referenced_tables list is empty.
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_timestamp
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -14,3 +14,11 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_fxa_events
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- event
|
||||
|
|
|
@ -14,3 +14,11 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_fxa_events
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- event
|
||||
|
|
|
@ -17,3 +17,11 @@ scheduling:
|
|||
# depends only on fxa logs produced via Stackdriver integration, so no other
|
||||
# scheduled tasks are involved and the referenced_tables list is empty.
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- command
|
||||
|
|
|
@ -10,3 +10,8 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_fxa_events
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -15,8 +15,8 @@ scheduling:
|
|||
dag_name: bqetl_fxa_events
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -21,8 +21,8 @@ scheduling:
|
|||
- submission_date:DATE:{{ds}}
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: first_seen_date
|
||||
type: day
|
||||
field: first_seen_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -21,8 +21,8 @@ scheduling:
|
|||
start_date: '2019-04-23'
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
expiration_days: null
|
||||
clustering:
|
||||
|
|
|
@ -10,3 +10,12 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_fxa_events
|
||||
date_partition_parameter: submission_date
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- service
|
||||
- user_id
|
||||
|
|
|
@ -24,8 +24,8 @@ scheduling:
|
|||
date_partition_parameter: submission_date
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: timestamp
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -25,8 +25,8 @@ scheduling:
|
|||
]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: first_seen_date
|
||||
type: day
|
||||
field: first_seen_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -22,8 +22,8 @@ scheduling:
|
|||
]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -15,3 +15,12 @@ labels:
|
|||
# # making it incremental is possible but nuanced since it windows over
|
||||
# # events that may cross the midnight boundary.
|
||||
# date_partition_parameter: null
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: first_service_timestamp
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- service
|
||||
- user_id
|
||||
|
|
|
@ -14,3 +14,12 @@ labels:
|
|||
# dag_name: bqetl_fxa_events
|
||||
# depends_on_past: true
|
||||
# start_date: '2019-10-08'
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- service
|
||||
- user_id
|
||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
|||
dag_name: bqetl_fxa_events
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
|||
dag_name: bqetl_fxa_events
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
referenced_tables: []
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -11,3 +11,8 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_fxa_events
|
||||
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -7,8 +7,8 @@ labels:
|
|||
incremental: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
expiration_days: null
|
||||
clustering:
|
||||
|
|
|
@ -76,8 +76,8 @@ scheduling:
|
|||
- health_v4
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: datetime
|
||||
type: day
|
||||
field: datetime
|
||||
require_partition_filter: null
|
||||
clustering:
|
||||
fields:
|
||||
|
|
|
@ -8,3 +8,8 @@ labels:
|
|||
incremental: true
|
||||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,11 @@ labels:
|
|||
incremental: true
|
||||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
|
|
|
@ -17,3 +17,12 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_event_rollup
|
||||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- category
|
||||
- event
|
||||
|
|
|
@ -20,3 +20,11 @@ scheduling:
|
|||
'event_types_v1'
|
||||
],
|
||||
]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- sample_id
|
||||
|
|
|
@ -10,3 +10,8 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
task_name: messaging_system_onboarding_exact_mau28_by_dimensions
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,11 @@ labels:
|
|||
incremental: true
|
||||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
|
|
|
@ -10,3 +10,8 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
task_name: messaging_system_snippets_exact_mau28_by_dimensions
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -7,3 +7,11 @@ labels:
|
|||
incremental: true
|
||||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
|
|
|
@ -10,3 +10,11 @@ labels:
|
|||
scheduling:
|
||||
dag_name: bqetl_messaging_system
|
||||
depends_on_past: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
clustering:
|
||||
fields:
|
||||
- release_channel
|
||||
|
|
|
@ -10,3 +10,8 @@ scheduling:
|
|||
referenced_tables:
|
||||
- ['moz-fx-data-shared-prod', 'monitoring_derived', 'stable_table_sizes_v1']
|
||||
- ['moz-fx-data-shared-prod', '*_stable', "*"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -9,3 +9,8 @@ owners:
|
|||
scheduling:
|
||||
dag_name: bqetl_monitoring
|
||||
arguments: ["--date", "{{ ds }}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -10,3 +10,8 @@ owners:
|
|||
scheduling:
|
||||
dag_name: bqetl_monitoring
|
||||
arguments: ["--date", "{{ ds }}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -10,6 +10,6 @@ scheduling:
|
|||
arguments: ["--date", "{{ ds }}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: change_date
|
||||
type: day
|
||||
field: change_date
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -10,5 +10,6 @@ scheduling:
|
|||
arguments: ["--date", "{{ ds }}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -10,6 +10,6 @@ scheduling:
|
|||
arguments: ["--date", "{{ ds }}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: creation_date
|
||||
type: day
|
||||
field: creation_date
|
||||
require_partition_filter: true
|
||||
|
|
|
@ -10,3 +10,8 @@ scheduling:
|
|||
arguments: ["--date", "{{ ds }}"]
|
||||
referenced_tables:
|
||||
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -18,3 +18,8 @@ scheduling:
|
|||
- ['moz-fx-data-shared-prod',
|
||||
'monitoring',
|
||||
'payload_bytes_decoded_telemetry']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -9,3 +9,14 @@ labels:
|
|||
incremental: true
|
||||
scheduling:
|
||||
dag_name: bqetl_monitoring
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
clustering:
|
||||
fields:
|
||||
- document_namespace
|
||||
- document_type
|
||||
- path
|
||||
- job_name
|
||||
|
|
|
@ -15,3 +15,8 @@ scheduling:
|
|||
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
||||
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
|
||||
- ['moz-fx-data-shared-prod', '*_derived', '*']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -15,6 +15,6 @@ scheduling:
|
|||
parameters: ["submission_date:DATE:{{ds}}"]
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -10,8 +10,8 @@ labels:
|
|||
incremental: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
scheduling:
|
||||
dag_name: bqetl_monitoring
|
||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
|||
arguments: ["--date", "{{ ds }}"]
|
||||
referenced_tables:
|
||||
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -10,8 +10,8 @@ labels:
|
|||
incremental: true
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
field: submission_date
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
scheduling:
|
||||
dag_name: bqetl_monitoring
|
||||
|
|
|
@ -12,3 +12,8 @@ scheduling:
|
|||
dag_name: bqetl_monitoring
|
||||
referenced_tables:
|
||||
- ['moz-fx-data-shared-prod', '*_stable', '*']
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: submission_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -14,3 +14,8 @@ scheduling:
|
|||
# delay aggregates by 7 days, to ensure data is complete
|
||||
date_partition_offset: -7
|
||||
date_partition_parameter: date
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: active_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -11,3 +11,8 @@ scheduling:
|
|||
# delay aggregates by 7 days, to ensure data is complete
|
||||
date_partition_offset: -7
|
||||
date_partition_parameter: date
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: active_date
|
||||
require_partition_filter: false
|
||||
|
|
|
@ -8,3 +8,8 @@ labels:
|
|||
schedule: daily
|
||||
scheduling:
|
||||
dag_name: bqetl_subplat
|
||||
bigquery:
|
||||
time_partitioning:
|
||||
type: day
|
||||
field: timestamp
|
||||
require_partition_filter: false
|
||||
|
|
Некоторые файлы не были показаны из-за слишком большого количества измененных файлов Показать больше
Загрузка…
Ссылка в новой задаче