Correct BigQuery partitioning/clustering metadata in ETL `metadata.yaml` files (#3500)

* Add missing BigQuery partitioning/clustering metadata.
* Correct existing BigQuery partitioning/clustering metadata.
* Allow partition `field` metadata field to be omitted.
* List partition `type` metadata field first.
This commit is contained in:
Sean Rose 2023-01-12 13:58:53 -08:00 коммит произвёл GitHub
Родитель 6978139496
Коммит 495ddcf39f
Не найден ключ, соответствующий данной подписи
Идентификатор ключа GPG: 4AEE18F83AFDEB23
220 изменённых файлов: 1011 добавлений и 96 удалений

Просмотреть файл

@ -57,8 +57,8 @@ class PartitionType(enum.Enum):
class PartitionMetadata:
"""Metadata for defining BigQuery table partitions."""
field: str
type: PartitionType
field: Optional[str] = attr.ib(None)
require_partition_filter: bool = attr.ib(True)
expiration_days: Optional[float] = attr.ib(None)

Просмотреть файл

@ -58,8 +58,8 @@ owners:
- wlachance@mozilla.com
bigquery:
time_partitioning:
field: date
type: day
field: date
require_partition_filter: true
expiration_days: null
clustering:
@ -91,8 +91,8 @@ owners:
- wlachance@mozilla.com
bigquery:
time_partitioning:
field: date
type: day
field: date
require_partition_filter: true
expiration_days: null
clustering:

Просмотреть файл

@ -25,3 +25,8 @@ scheduling:
# explicit query file path is necessary because the destination table
# includes a partition identifier that is not in the path
sql/moz-fx-cjms-nonprod-9a36/cjms_bigquery/flows_v1/query.sql
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -9,3 +9,8 @@ labels:
scheduling:
dag_name: bqetl_subplat
query_project: moz-fx-data-shared-prod
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,8 @@ owners:
scheduling:
dag_name: bqetl_experiments_daily
referenced_tables: [['region-us', 'INFORMATION_SCHEMA', 'JOBS_BY_PROJECT']]
bigquery:
time_partitioning:
type: day
field: submission_timestamp
require_partition_filter: false

Просмотреть файл

@ -21,13 +21,12 @@ scheduling:
bigquery:
time_partitioning:
field: last_modified_date
type: day
field: last_modified_date
require_partition_filter: false
clustering:
fields:
- double_opt_in
- has_opted_out_of_email
- double_opt_in
- email_lang
- mailing_country
- cohort

Просмотреть файл

@ -34,6 +34,12 @@ scheduling:
bigquery:
time_partitioning:
field: last_modified_date
type: day
field: last_modified_date
require_partition_filter: false
clustering:
fields:
- has_opted_out_of_email
- double_opt_in
- email_lang
- mailing_country

Просмотреть файл

@ -24,13 +24,12 @@ scheduling:
bigquery:
time_partitioning:
field: last_modified_date
type: day
field: last_modified_date
require_partition_filter: false
clustering:
fields:
- double_opt_in
- has_opted_out_of_email
- double_opt_in
- email_lang
- mailing_country
- cohort

Просмотреть файл

@ -37,6 +37,11 @@ scheduling:
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- event_type
- recipient_type
- body_type

Просмотреть файл

@ -24,8 +24,8 @@ scheduling:
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:

Просмотреть файл

@ -10,3 +10,14 @@ scheduling:
referenced_tables:
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_goals_v1']
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_sessions_v1']
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false
clustering:
fields:
- country
- browser
- blog
- subblog

Просмотреть файл

@ -9,3 +9,8 @@ scheduling:
dag_name: bqetl_google_analytics_derived
referenced_tables:
- ['moz-fx-data-marketing-prod', 'ga_derived', 'blogs_empty_check_v1']
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false

Просмотреть файл

@ -11,3 +11,14 @@ scheduling:
referenced_tables:
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_goals_v1"]
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_sessions_v1"]
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false
clustering:
fields:
- cleaned_landing_page
- browser
- blog
- subblog

Просмотреть файл

@ -10,3 +10,8 @@ scheduling:
dag_name: bqetl_google_analytics_derived
referenced_tables:
- ["moz-fx-data-marketing-prod", "ga_derived", "blogs_empty_check_v1"]
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,8 @@ owners:
- ascholtz@mozilla.com
scheduling:
dag_name: bqetl_google_analytics_derived
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,14 @@ owners:
- ascholtz@mozilla.com
scheduling:
dag_name: bqetl_google_analytics_derived
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false
clustering:
fields:
- page_name
- event_category
- event_action
- event_label

Просмотреть файл

@ -9,3 +9,8 @@ scheduling:
dag_name: bqetl_google_analytics_derived
referenced_tables:
- ['moz-fx-data-marketing-prod', 'ga_derived', 'www_site_empty_check_v1']
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,14 @@ owners:
- ascholtz@mozilla.com
scheduling:
dag_name: bqetl_google_analytics_derived
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false
clustering:
fields:
- page_name
- country
- locale
- medium

Просмотреть файл

@ -7,3 +7,14 @@ owners:
- ascholtz@mozilla.com
scheduling:
dag_name: bqetl_google_analytics_derived
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false
clustering:
fields:
- country
- browser
- source
- medium

Просмотреть файл

@ -7,3 +7,14 @@ owners:
- ascholtz@mozilla.com
scheduling:
dag_name: bqetl_google_analytics_derived
bigquery:
time_partitioning:
type: day
field: date
require_partition_filter: false
clustering:
fields:
- page_name
- country
- locale
- medium

Просмотреть файл

@ -13,6 +13,6 @@ scheduling:
depends_on_past: true
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -16,6 +16,6 @@ scheduling:
arguments: ["--date", "{{ ds }}"]
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -18,6 +18,6 @@ scheduling:
bigquery:
time_partitioning:
field: submission_date
type: day
field: date
require_partition_filter: false

Просмотреть файл

@ -10,6 +10,15 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_activity_stream
bigquery:
time_partitioning:
type: day
field: submission_timestamp
require_partition_filter: true
expiration_days: 180
clustering:
fields:
- experiment_id
workgroup_access:
- role: roles/bigquery.dataViewer
members:

Просмотреть файл

@ -8,6 +8,16 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_activity_stream
bigquery:
time_partitioning:
type: day
field: submission_timestamp
require_partition_filter: true
expiration_days: 180
clustering:
fields:
- release_channel
- sample_id
workgroup_access:
- role: roles/bigquery.dataViewer
members:

Просмотреть файл

@ -10,3 +10,11 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_amo_stats
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- addon_id

Просмотреть файл

@ -10,3 +10,11 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_amo_stats
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- hashed_addon_id

Просмотреть файл

@ -15,3 +15,11 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_amo_stats
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- addon_id

Просмотреть файл

@ -15,3 +15,11 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_amo_stats
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- hashed_addon_id

Просмотреть файл

@ -15,3 +15,11 @@ scheduling:
# query to get it, and that would be slow because main_v4 is referenced
referenced_tables: [['moz-fx-data-shared-prod', 'telemetry_stable',
'main_v4']]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- sample_id

Просмотреть файл

@ -12,3 +12,11 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_amo_stats
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- sample_id

Просмотреть файл

@ -10,7 +10,7 @@ scheduling:
dag_name: bqetl_ctxsvc_derived
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true
expiration_days: null

Просмотреть файл

@ -8,5 +8,9 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_ctxsvc_derived
bigquery: null
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
references: {}

Просмотреть файл

@ -8,5 +8,9 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_ctxsvc_derived
bigquery: null
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
references: {}

Просмотреть файл

@ -9,3 +9,12 @@ labels:
scheduling:
dag_name: bqetl_ctxsvc_derived
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- source
- event_type

Просмотреть файл

@ -13,8 +13,8 @@ labels:
bigquery:
time_partitioning:
field: submission_date
type: month
field: submission_date
require_partition_filter: true
scheduling:

Просмотреть файл

@ -26,9 +26,9 @@ scheduling:
execution_delta: 0h
bigquery:
time_partitioning:
field: submission_date
type: day
require_partition_filter: true
field: submission_date
require_partition_filter: false
clustering:
fields:
- adjust_network

Просмотреть файл

@ -22,8 +22,8 @@ scheduling:
execution_delta: 1h
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:

Просмотреть файл

@ -17,3 +17,12 @@ labels:
scheduling:
dag_name: bqetl_fenix_event_rollup
depends_on_past: true
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- category
- event

Просмотреть файл

@ -20,3 +20,11 @@ scheduling:
'event_types_v1'
],
]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- sample_id

Просмотреть файл

@ -43,8 +43,8 @@ scheduling:
- submission_date:DATE:{{ds}}
bigquery:
time_partitioning:
field: first_seen_date
type: day
field: first_seen_date
require_partition_filter: false
clustering:
fields:

Просмотреть файл

@ -7,8 +7,8 @@ labels:
incremental: true
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true
expiration_days: null
clustering:

Просмотреть файл

@ -14,8 +14,8 @@ scheduling:
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
bigquery:
time_partitioning:
field: date
type: day
field: date
require_partition_filter: false
expiration_days: null
clustering: null

Просмотреть файл

@ -13,8 +13,8 @@ scheduling:
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
bigquery:
time_partitioning:
field: date
type: day
field: date
require_partition_filter: false
expiration_days: null
clustering: null

Просмотреть файл

@ -17,3 +17,12 @@ labels:
scheduling:
dag_name: bqetl_event_rollup
depends_on_past: true
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- category
- event

Просмотреть файл

@ -20,3 +20,11 @@ scheduling:
'event_types_v1'
],
]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- sample_id

Просмотреть файл

@ -9,3 +9,8 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_fxa_events
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -13,4 +13,8 @@ scheduling:
dag_name: bqetl_event_rollup
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
task_name: funnel_events_source__v1
bigquery: null
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -9,3 +9,11 @@ labels:
application: fxa
incremental: true
schedule: daily
bigquery:
time_partitioning:
type: day
field: submission_date_pacific
require_partition_filter: false
clustering:
fields:
- user_id

Просмотреть файл

@ -15,3 +15,8 @@ labels:
# dag_name: bqetl_fxa_events
# arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
# referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false

Просмотреть файл

@ -11,3 +11,8 @@ scheduling:
dag_name: bqetl_fxa_events
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: true

Просмотреть файл

@ -11,3 +11,8 @@ scheduling:
dag_name: bqetl_fxa_events
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false

Просмотреть файл

@ -16,3 +16,8 @@ scheduling:
# depends only on fxa logs produced via Stackdriver integration, so no other
# scheduled tasks are involved and the referenced_tables list is empty.
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: submission_timestamp
require_partition_filter: false

Просмотреть файл

@ -14,3 +14,11 @@ labels:
scheduling:
dag_name: bqetl_fxa_events
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false
clustering:
fields:
- event

Просмотреть файл

@ -14,3 +14,11 @@ labels:
scheduling:
dag_name: bqetl_fxa_events
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false
clustering:
fields:
- event

Просмотреть файл

@ -17,3 +17,11 @@ scheduling:
# depends only on fxa logs produced via Stackdriver integration, so no other
# scheduled tasks are involved and the referenced_tables list is empty.
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false
clustering:
fields:
- command

Просмотреть файл

@ -10,3 +10,8 @@ labels:
scheduling:
dag_name: bqetl_fxa_events
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false

Просмотреть файл

@ -15,8 +15,8 @@ scheduling:
dag_name: bqetl_fxa_events
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:

Просмотреть файл

@ -21,8 +21,8 @@ scheduling:
- submission_date:DATE:{{ds}}
bigquery:
time_partitioning:
field: first_seen_date
type: day
field: first_seen_date
require_partition_filter: false
clustering:
fields:

Просмотреть файл

@ -21,8 +21,8 @@ scheduling:
start_date: '2019-04-23'
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true
expiration_days: null
clustering:

Просмотреть файл

@ -10,3 +10,12 @@ labels:
scheduling:
dag_name: bqetl_fxa_events
date_partition_parameter: submission_date
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- service
- user_id

Просмотреть файл

@ -24,8 +24,8 @@ scheduling:
date_partition_parameter: submission_date
bigquery:
time_partitioning:
field: timestamp
type: day
field: timestamp
require_partition_filter: true
clustering:
fields:

Просмотреть файл

@ -25,8 +25,8 @@ scheduling:
]
bigquery:
time_partitioning:
field: first_seen_date
type: day
field: first_seen_date
require_partition_filter: true
clustering:
fields:

Просмотреть файл

@ -22,8 +22,8 @@ scheduling:
]
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:

Просмотреть файл

@ -15,3 +15,12 @@ labels:
# # making it incremental is possible but nuanced since it windows over
# # events that may cross the midnight boundary.
# date_partition_parameter: null
bigquery:
time_partitioning:
type: day
field: first_service_timestamp
require_partition_filter: false
clustering:
fields:
- service
- user_id

Просмотреть файл

@ -14,3 +14,12 @@ labels:
# dag_name: bqetl_fxa_events
# depends_on_past: true
# start_date: '2019-10-08'
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- service
- user_id

Просмотреть файл

@ -12,3 +12,8 @@ scheduling:
dag_name: bqetl_fxa_events
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: true

Просмотреть файл

@ -12,3 +12,8 @@ scheduling:
dag_name: bqetl_fxa_events
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
referenced_tables: []
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: true

Просмотреть файл

@ -11,3 +11,8 @@ labels:
scheduling:
dag_name: bqetl_fxa_events
arguments: ['--schema_update_option=ALLOW_FIELD_ADDITION']
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: true

Просмотреть файл

@ -7,8 +7,8 @@ labels:
incremental: true
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true
expiration_days: null
clustering:

Просмотреть файл

@ -76,8 +76,8 @@ scheduling:
- health_v4
bigquery:
time_partitioning:
field: datetime
type: day
field: datetime
require_partition_filter: null
clustering:
fields:

Просмотреть файл

@ -8,3 +8,8 @@ labels:
incremental: true
scheduling:
dag_name: bqetl_messaging_system
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,11 @@ labels:
incremental: true
scheduling:
dag_name: bqetl_messaging_system
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- release_channel

Просмотреть файл

@ -10,3 +10,11 @@ labels:
scheduling:
dag_name: bqetl_messaging_system
depends_on_past: true
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- release_channel

Просмотреть файл

@ -17,3 +17,12 @@ labels:
scheduling:
dag_name: bqetl_event_rollup
depends_on_past: true
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- category
- event

Просмотреть файл

@ -20,3 +20,11 @@ scheduling:
'event_types_v1'
],
]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- sample_id

Просмотреть файл

@ -10,3 +10,8 @@ labels:
scheduling:
dag_name: bqetl_messaging_system
task_name: messaging_system_onboarding_exact_mau28_by_dimensions
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,11 @@ labels:
incremental: true
scheduling:
dag_name: bqetl_messaging_system
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- release_channel

Просмотреть файл

@ -10,3 +10,11 @@ labels:
scheduling:
dag_name: bqetl_messaging_system
depends_on_past: true
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- release_channel

Просмотреть файл

@ -10,3 +10,8 @@ labels:
scheduling:
dag_name: bqetl_messaging_system
task_name: messaging_system_snippets_exact_mau28_by_dimensions
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -7,3 +7,11 @@ labels:
incremental: true
scheduling:
dag_name: bqetl_messaging_system
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- release_channel

Просмотреть файл

@ -10,3 +10,11 @@ labels:
scheduling:
dag_name: bqetl_messaging_system
depends_on_past: true
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: true
clustering:
fields:
- release_channel

Просмотреть файл

@ -10,3 +10,8 @@ scheduling:
referenced_tables:
- ['moz-fx-data-shared-prod', 'monitoring_derived', 'stable_table_sizes_v1']
- ['moz-fx-data-shared-prod', '*_stable', "*"]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -9,3 +9,8 @@ owners:
scheduling:
dag_name: bqetl_monitoring
arguments: ["--date", "{{ ds }}"]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -10,3 +10,8 @@ owners:
scheduling:
dag_name: bqetl_monitoring
arguments: ["--date", "{{ ds }}"]
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -10,6 +10,6 @@ scheduling:
arguments: ["--date", "{{ ds }}"]
bigquery:
time_partitioning:
field: change_date
type: day
field: change_date
require_partition_filter: true

Просмотреть файл

@ -10,5 +10,6 @@ scheduling:
arguments: ["--date", "{{ ds }}"]
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: true

Просмотреть файл

@ -10,6 +10,6 @@ scheduling:
arguments: ["--date", "{{ ds }}"]
bigquery:
time_partitioning:
field: creation_date
type: day
field: creation_date
require_partition_filter: true

Просмотреть файл

@ -10,3 +10,8 @@ scheduling:
arguments: ["--date", "{{ ds }}"]
referenced_tables:
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -18,3 +18,8 @@ scheduling:
- ['moz-fx-data-shared-prod',
'monitoring',
'payload_bytes_decoded_telemetry']
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -9,3 +9,14 @@ labels:
incremental: true
scheduling:
dag_name: bqetl_monitoring
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false
clustering:
fields:
- document_namespace
- document_type
- path
- job_name

Просмотреть файл

@ -15,3 +15,8 @@ scheduling:
- ['moz-fx-data-shared-prod', '*_stable', '*']
- ['moz-fx-data-shared-prod', 'telemetry_stable', 'main_v4']
- ['moz-fx-data-shared-prod', '*_derived', '*']
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -15,6 +15,6 @@ scheduling:
parameters: ["submission_date:DATE:{{ds}}"]
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -10,8 +10,8 @@ labels:
incremental: true
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false
scheduling:
dag_name: bqetl_monitoring

Просмотреть файл

@ -12,3 +12,8 @@ scheduling:
arguments: ["--date", "{{ ds }}"]
referenced_tables:
- ['moz-fx-data-shared-prod', '*_stable', '*']
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -10,8 +10,8 @@ labels:
incremental: true
bigquery:
time_partitioning:
field: submission_date
type: day
field: submission_date
require_partition_filter: false
scheduling:
dag_name: bqetl_monitoring

Просмотреть файл

@ -12,3 +12,8 @@ scheduling:
dag_name: bqetl_monitoring
referenced_tables:
- ['moz-fx-data-shared-prod', '*_stable', '*']
bigquery:
time_partitioning:
type: day
field: submission_date
require_partition_filter: false

Просмотреть файл

@ -14,3 +14,8 @@ scheduling:
# delay aggregates by 7 days, to ensure data is complete
date_partition_offset: -7
date_partition_parameter: date
bigquery:
time_partitioning:
type: day
field: active_date
require_partition_filter: false

Просмотреть файл

@ -11,3 +11,8 @@ scheduling:
# delay aggregates by 7 days, to ensure data is complete
date_partition_offset: -7
date_partition_parameter: date
bigquery:
time_partitioning:
type: day
field: active_date
require_partition_filter: false

Просмотреть файл

@ -8,3 +8,8 @@ labels:
schedule: daily
scheduling:
dag_name: bqetl_subplat
bigquery:
time_partitioning:
type: day
field: timestamp
require_partition_filter: false

Некоторые файлы не были показаны из-за слишком большого количества изменённых файлов. Показать больше