For context, I wasn’t able to run a simple gx.get_context() call
because it couldn’t find the initialized great_expectations.yaml file: I had accidentally deleted it, and even after I restored it, the changes I made to the new great_expectations.yaml were not detected.
The workaround was to point the Data Context at the directory I’m working in, so the code looks like this:
import os
import great_expectations as gx
context = gx.get_context(context_root_dir = os.getcwd())
At this step, the get_context() call takes a long time (more than 5 minutes) on my local machine.
My great_expectations.yaml looks something like this:
{
"anonymous_usage_statistics": {
"data_context_id": "a1ee0e05-e914-4b92-8a16-9092622492f3",
"explicit_id": true,
"explicit_url": false,
"usage_statistics_url": "https://stats.greatexpectations.io/great_expectations/v1/usage_statistics",
"enabled": true
},
"checkpoint_store_name": "checkpoint_store",
"config_variables_file_path": "config_variables.yml",
"config_version": 3.0,
"data_docs_sites": {
"local_site": {
"class_name": "SiteBuilder",
"show_how_to_buttons": true,
"store_backend": {
"class_name": "TupleFilesystemStoreBackend",
"base_directory": "uncommitted/data_docs/local_site/"
},
"site_index_builder": {
"class_name": "DefaultSiteIndexBuilder"
}
},
"s3_site": {
"class_name": "SiteBuilder",
"store_backend": {
"class_name": "TupleS3StoreBackend",
"bucket": "<>",
"prefix": "data_doc"
},
"site_index_builder": {
"class_name": "DefaultSiteIndexBuilder",
"validation_results_limit": 10,
"show_cta_footer": true
}
}
},
"datasources": {},
"evaluation_parameter_store_name": "evaluation_parameter_store",
"expectations_store_name": "expectations_S3_store",
"fluent_datasources": {},
"include_rendered_content": {
"expectation_suite": false,
"expectation_validation_result": false,
"globally": false
},
"plugins_directory": "plugins/",
"stores": {
"expectations_store": {
"class_name": "ExpectationsStore",
"store_backend": {
"class_name": "TupleFilesystemStoreBackend",
"base_directory": "expectations/"
}
},
"expectations_S3_store": {
"class_name": "ExpectationsStore",
"store_backend": {
"class_name": "TupleS3StoreBackend",
"bucket": "<>",
"prefix": "expectation_store"
}
},
"validations_store": {
"class_name": "ValidationsStore",
"store_backend": {
"class_name": "TupleFilesystemStoreBackend",
"base_directory": "uncommitted/validations/"
}
},
"validations_S3_store": {
"class_name": "ValidationsStore",
"store_backend": {
"class_name": "TupleS3StoreBackend",
"bucket": "<>",
"prefix": "validation_result_store"
}
},
"evaluation_parameter_store": {
"class_name": "EvaluationParameterStore"
},
"checkpoint_store": {
"class_name": "CheckpointStore",
"store_backend": {
"class_name": "TupleFilesystemStoreBackend",
"suppress_store_backend_id": true,
"base_directory": "checkpoints/"
}
},
"profiler_store": {
"class_name": "ProfilerStore",
"store_backend": {
"class_name": "TupleFilesystemStoreBackend",
"suppress_store_backend_id": true,
"base_directory": "profilers/"
}
}
},
"validations_store_name": "validations_S3_store"
}
Is this delay normal when the Data Context is trying to access S3?