examples.scripts.sample_dq_delta.current_dir = os.path.dirname(os.path.abspath(__file__))
module-attribute
examples.scripts.sample_dq_delta.dic_job_info = {'job': 'job_name', 'Region': 'NA', 'env': 'dev', 'Snapshot': '2024-04-15', 'data_object_name ': 'customer_order'}
module-attribute
examples.scripts.sample_dq_delta.job_info = str(dic_job_info)
module-attribute
examples.scripts.sample_dq_delta.se: SparkExpectations = SparkExpectations(product_id='your_product', rules_df=spark.table('dq_spark_dev.dq_rules'), stats_table='dq_spark_dev.dq_stats', stats_table_writer=writer, target_and_error_table_writer=writer, debugger=False, stats_streaming_options={user_config.se_enable_streaming: False})
module-attribute
examples.scripts.sample_dq_delta.spark = set_up_delta()
module-attribute
examples.scripts.sample_dq_delta.user_conf: Dict[str, Union[str, int, bool, Dict[str, str]]] = {user_config.se_notifications_smtp_password: 'w*******', user_config.se_notifications_smtp_creds_dict: {user_config.secret_type: 'cerberus', user_config.cbs_url: 'https://cerberus.example.com', user_config.cbs_sdb_path: 'your_sdb_path', user_config.cbs_smtp_password: 'your_smtp_password'}, user_config.se_notifications_enable_smtp_server_auth: False, user_config.se_enable_obs_dq_report_result: False, user_config.se_dq_obs_alert_flag: False, user_config.se_dq_obs_default_email_template: '', user_config.se_notifications_enable_email: False, user_config.se_notifications_enable_custom_email_body: False, user_config.se_notifications_email_smtp_host: 'smtp.office365.com', user_config.se_notifications_email_smtp_port: 587, user_config.se_notifications_email_from: 'a.dsm.*****.com', user_config.se_notifications_email_to_other_mail_id: 'abc@mail.com', user_config.se_notifications_email_subject: 'spark expectations - data quality - notifications', user_config.se_notifications_email_custom_body: "Spark Expectations Statistics for this dq run:\n 'product_id': {},\n 'table_name': {},\n 'source_agg_dq_results': {}',\n 'dq_status': {}", user_config.se_notifications_enable_slack: False, user_config.se_notifications_slack_webhook_url: '', user_config.se_notifications_on_start: False, user_config.se_notifications_on_completion: False, user_config.se_notifications_on_fail: False, user_config.se_notifications_on_error_drop_exceeds_threshold_breach: True, user_config.se_notifications_on_error_drop_threshold: 15, user_config.se_enable_query_dq_detailed_result: True, user_config.se_enable_agg_dq_detailed_result: True, user_config.se_enable_error_table: True, user_config.se_dq_rules_params: {'env': 'dev', 'table': 'product', 'data_object_name': 'customer_order', 'data_source': 'customer_source', 'data_layer': 'Integrated'}, user_config.se_job_metadata: job_info}
module-attribute
examples.scripts.sample_dq_delta.writer = WrappedDataFrameWriter().mode('append').format('delta')
module-attribute
examples.scripts.sample_dq_delta.build_new() -> DataFrame
examples/scripts/sample_dq_delta.py