examples.scripts.sample_dq_bigquery.current_dir = os.path.dirname(os.path.abspath(__file__))
module-attribute
examples.scripts.sample_dq_bigquery.dic_job_info = {'job': 'job_name', 'Region': 'NA', 'Snapshot': '2024-04-15'}
module-attribute
examples.scripts.sample_dq_bigquery.job_info = str(dic_job_info)
module-attribute
examples.scripts.sample_dq_bigquery.se: SparkExpectations = SparkExpectations(product_id='your_product', rules_df=spark.read.format('bigquery').load('<project_id>.<dataset_id>.<rules_table>'), stats_table='<project_id>.<dataset_id>.<stats_table>', stats_table_writer=writer, target_and_error_table_writer=writer, debugger=False)
module-attribute
examples.scripts.sample_dq_bigquery.spark = set_up_bigquery('<temp_dataset>')
module-attribute
examples.scripts.sample_dq_bigquery.user_conf: Dict[str, Union[str, int, bool, Dict[str, str]]] = {user_config.se_notifications_enable_email: False, user_config.se_notifications_email_smtp_host: 'mailhost.com', user_config.se_notifications_email_smtp_port: 25, user_config.se_notifications_email_from: '', user_config.se_notifications_email_to_other_mail_id: '', user_config.se_notifications_email_subject: 'spark expectations - data quality - notifications', user_config.se_notifications_enable_slack: False, user_config.se_notifications_slack_webhook_url: '', user_config.se_notifications_on_start: True, user_config.se_notifications_on_completion: True, user_config.se_notifications_on_fail: True, user_config.se_notifications_on_error_drop_exceeds_threshold_breach: True, user_config.se_notifications_on_error_drop_threshold: 15, user_config.se_enable_query_dq_detailed_result: True, user_config.se_enable_agg_dq_detailed_result: True, user_config.se_enable_error_table: True, user_config.se_dq_rules_params: {'env': 'local', 'table': 'product'}, user_config.se_job_metadata: job_info}
module-attribute
examples.scripts.sample_dq_bigquery.writer = WrappedDataFrameWriter().mode('overwrite').format('bigquery').option('createDisposition', 'CREATE_IF_NEEDED').option('writeMethod', 'direct')
module-attribute
examples.scripts.sample_dq_bigquery.build_new() -> DataFrame
Source code in examples/scripts/sample_dq_bigquery.py