Skip to content
This repository has been archived by the owner on May 26, 2021. It is now read-only.

Commit

Permalink
Extract period before aggregate
Browse files: browse the repository at this point in the history
  • Loading branch information
georgiana-b committed Jul 30, 2016
1 parent 33651d1 commit 27d00db
Show file tree
Hide file tree
Showing 2 changed files with 4 additions and 5 deletions.
4 changes: 4 additions & 0 deletions data_quality/main.py
Original file line number Diff line number Diff line change
@@ -25,6 +25,10 @@ def run(config_file_path, deploy, encoding):
utilities.set_up_cache_dir(config['cache_dir'])
source_filepath = os.path.join(config['data_dir'], config['source_file'])

if config['assess_timeliness'] is True:
extractor = tasks.extract_relevance_period.RelevancePeriodExtractor(config)
extractor.run()

aggregator = tasks.Aggregator(config)

if deploy:
Expand Down
5 changes: 0 additions & 5 deletions data_quality/tasks/aggregate.py
Original file line number Diff line number Diff line change
@@ -50,11 +50,6 @@ def __init__(self, config, **kwargs):
def run(self, pipeline):
"""Run on a Pipeline instance."""

if self.assess_timeliness:
extractor = RelevancePeriodExtractor(self.config)
extractor.run()
self.lookup = self.get_lookup()

with compat.UnicodeAppender(self.result_file, quoting=csv.QUOTE_MINIMAL) as result_file:
source = self.get_source(pipeline.data_source)
result_id = compat.str(uuid.uuid4().hex)
Expand Down

0 comments on commit 27d00db

Please sign in to comment.