From 498c989e58e7b3f2f5724341f2f9ad7fce959d41 Mon Sep 17 00:00:00 2001
From: thoppe
Date: Sun, 27 Sep 2015 20:56:16 -0400
Subject: [PATCH] Added search data collater

---
Review notes (text between the three-dash line and the diff is commentary and
is not applied):

 * collate_search_data.py loads every file matched by search_data/* as JSON,
   replaces js["items"] with the list of each item's "full_name" value, and
   writes the result back to the same path.
 * The handler around that rewrite was a bare `except:`, which also swallowed
   KeyboardInterrupt/SystemExit and reported any failure as "already
   collated". It is narrowed to (KeyError, TypeError): the errors raised when
   "items"/"full_name" is missing or when the items are already plain strings.
   Other errors now propagate instead of being silently skipped.
 * NOTE(review): this patch was recovered from a copy whose line breaks and
   indentation had been collapsed. Indentation is assumed to be 4 spaces, and
   the blank context lines in the run_fixer.py and src/word_fix.py hunks were
   placed to satisfy the hunk line counts -- confirm against the repository
   before applying.
 * NOTE(review): the `index` line for collate_search_data.py still carries the
   blob id from before the except-clause change; regenerate the patch if the
   id matters (e.g. for a 3-way apply).

 collate_search_data.py         | 24 ++++++++++++++++++++++++
 run_fixer.py                   |  3 ++-
 src/__init__.py                |  0
 word_fix.py => src/word_fix.py |  3 ---
 4 files changed, 26 insertions(+), 4 deletions(-)
 create mode 100644 collate_search_data.py
 create mode 100644 src/__init__.py
 rename word_fix.py => src/word_fix.py (99%)

diff --git a/collate_search_data.py b/collate_search_data.py
new file mode 100644
index 0000000..f7354c4
--- /dev/null
+++ b/collate_search_data.py
@@ -0,0 +1,24 @@
+import os, glob, json, codecs
+
+F_SEARCH = sorted(glob.glob("search_data/*"))
+
+def load_word_file(f):
+    with codecs.open(f,'r','utf-8') as FIN:
+        js = json.loads(FIN.read())
+    return js
+
+for f in F_SEARCH:
+    js = load_word_file(f)
+
+    try:
+        js["items"] = [item["full_name"] for item in js["items"]]
+    except (KeyError, TypeError):
+        print "{} looks to be collated already".format(f)
+        continue
+
+    with codecs.open(f,'w','utf-8') as FOUT:
+        FOUT.write(json.dumps(js))
+
+    print "Completed {}".format(f)
+
+
diff --git a/run_fixer.py b/run_fixer.py
index 540bfaf..159fd04 100644
--- a/run_fixer.py
+++ b/run_fixer.py
@@ -1,4 +1,5 @@
-
+import os, glob
+from src.word_fix import fix_word
 
 '''
 def load_word_file(f):
diff --git a/src/__init__.py b/src/__init__.py
new file mode 100644
index 0000000..e69de29
diff --git a/word_fix.py b/src/word_fix.py
similarity index 99%
rename from word_fix.py
rename to src/word_fix.py
index a46fa26..46a7eeb 100644
--- a/word_fix.py
+++ b/src/word_fix.py
@@ -4,9 +4,6 @@ logging.basicConfig(level=logging.INFO)
 logging.getLogger("requests").setLevel(logging.WARNING)
 
 
-## TO DO:
-## LOG AS COMPLETE!
-
 FLAG_fork = True
 FLAG_delete = True
 