diff --git a/data_quality/main.py b/data_quality/main.py index f66b6ae..633d05d 100644 --- a/data_quality/main.py +++ b/data_quality/main.py @@ -25,6 +25,10 @@ def run(config_file_path, deploy, encoding): utilities.set_up_cache_dir(config['cache_dir']) source_filepath = os.path.join(config['data_dir'], config['source_file']) + if config['assess_timeliness'] is True: + extractor = tasks.extract_relevance_period.RelevancePeriodExtractor(config) + extractor.run() + aggregator = tasks.Aggregator(config) if deploy: diff --git a/data_quality/tasks/aggregate.py b/data_quality/tasks/aggregate.py index f814617..669b031 100644 --- a/data_quality/tasks/aggregate.py +++ b/data_quality/tasks/aggregate.py @@ -50,11 +50,6 @@ def __init__(self, config, **kwargs): def run(self, pipeline): """Run on a Pipeline instance.""" - if self.assess_timeliness: - extractor = RelevancePeriodExtractor(self.config) - extractor.run() - self.lookup = self.get_lookup() - with compat.UnicodeAppender(self.result_file, quoting=csv.QUOTE_MINIMAL) as result_file: source = self.get_source(pipeline.data_source) result_id = compat.str(uuid.uuid4().hex)