In [1]:
import json
import requests
from os import makedirs
from os.path import join, exists
from datetime import date, timedelta

In [2]:

def get_news_by_date_range(query_terms, query_fields, show_fields, start_date, end_date, subdir, year):

    ARTICLES_DIR = join('data', 'guardian', subdir, year)
    makedirs(ARTICLES_DIR, exist_ok=True)

    MY_API_KEY = open("creds_guardian.txt").read().strip()
    API_ENDPOINT = 'http://content.guardianapis.com/search'
    my_params = {
        'from-date': "",
        'to-date': "",
        'order-by': "newest",
        'edition': 'US',
        'show-fields': show_fields,
        'q': query_terms,
        'query-fields': query_fields,
        'sectionName': 'politics',
        'page-size': 200,
        'api-key': MY_API_KEY
    }

    # day iteration from here:
    # http://stackoverflow.com/questions/7274267/print-all-day-dates-between-two-dates
    
    dayrange = range((end_date - start_date).days + 1)
    
    for daycount in dayrange:
        dt = start_date + timedelta(days=daycount)
        datestr = dt.strftime('%Y-%m-%d')
        fname_h = join(ARTICLES_DIR, datestr + '.json')
        fname_b = join(ARTICLES_DIR, datestr + '-b.json')
        
        if not exists(fname_h):
            # then let's download it
            print("Downloading", datestr)
            all_results_h = []
            all_results_b = []
            
            my_params['from-date'] = datestr
            my_params['to-date'] = datestr
            current_page = 1
            total_pages = 1
            while current_page <= total_pages:
                #print("...page", current_page)
                my_params['page'] = current_page
                resp = requests.get(API_ENDPOINT, my_params)
                data = resp.json()
                #all_results.extend(data['response']['results'])
                for result in data['response']['results']:

                    if(len(result['fields']['headline']) > 0):
                        #print(result['fields'][get_field])
                        all_results_h.append(result['fields']['headline'])
                        
                    if(len(result['fields']['body']) > 0):
                        #print(result['fields'][get_field])
                        all_results_b.append(result['fields']['body'])

                # if there is more than one page
                current_page += 1
                total_pages = data['response']['pages']

            with open(fname_h, 'w') as f:
                print("Writing to", fname_h)

                # re-serialize it for pretty indentation
                f.write(json.dumps(all_results_h, indent=2))
                
            with open(fname_b, 'w') as f:
                #print("Writing to", fname_b)

                # re-serialize it for pretty indentation
                f.write(json.dumps(all_results_b, indent=2))

In [3]:
search_key_2016 = '(president OR election) OR (donald OR trump OR hillary OR clinton OR barak OR obama)' 
search_key_2012 = '(president OR election) OR (romney OR mitt OR barak OR obama)' 
search_key_2008 = '(president OR election) OR (mccain OR john OR barak OR obama)' 
search_key_2004 = '(president OR election) OR (bush OR george OR john OR kerry)' 
search_key_2000 = '(president OR election) OR (bush OR george OR gore OR clinton OR bill)' 
search_key_2020 = '(president OR election) OR (donald OR trump OR hillary OR clinton OR joe OR biden)' 

get_news_by_date_range(search_key_2016, 'headline,body', 'headline,body,sectionName',
                        date(2016, 8, 8), date(2016, 11, 8), 'candidates', '2016')

get_news_by_date_range(search_key_2012, 'headline,body', 'headline,body,sectionName',
                       date(2012, 8, 6), date(2012, 11, 6), 'candidates', '2012')

get_news_by_date_range(search_key_2008, 'headline,body', 'headline,body,sectionName',
                       date(2008, 8, 4), date(2008, 11, 4), 'candidates', '2008')

get_news_by_date_range(search_key_2004, 'headline,body', 'headline,body,sectionName',
                       date(2004, 8, 2), date(2004, 11, 2), 'candidates', '2004')

get_news_by_date_range(search_key_2000, 'headline,body', 'headline,body,sectionName',
                       date(2000, 8, 7), date(2000, 11, 7), 'candidates', '2000')

get_news_by_date_range(search_key_2020, 'headline,body', 'headline,body,sectionName',
                       date(2020, 3, 12), date(2020, 6, 12), 'candidates', '2020')

Downloading 2012-08-06
Writing to data/guardian/2012/2012-08-06.json
Downloading 2012-08-07
Writing to data/guardian/2012/2012-08-07.json
Downloading 2012-08-08
Writing to data/guardian/2012/2012-08-08.json
Downloading 2012-08-09
Writing to data/guardian/2012/2012-08-09.json
Downloading 2012-08-10
Writing to data/guardian/2012/2012-08-10.json
Downloading 2012-08-11
Writing to data/guardian/2012/2012-08-11.json
Downloading 2012-08-12
Writing to data/guardian/2012/2012-08-12.json
Downloading 2012-08-13
Writing to data/guardian/2012/2012-08-13.json
Downloading 2012-08-14
Writing to data/guardian/2012/2012-08-14.json
Downloading 2012-08-15
Writing to data/guardian/2012/2012-08-15.json
Downloading 2012-08-16
Writing to data/guardian/2012/2012-08-16.json
Downloading 2012-08-17
Writing to data/guardian/2012/2012-08-17.json
Downloading 2012-08-18
Writing to data/guardian/2012/2012-08-18.json
Downloading 2012-08-19
Writing to data/guardian/2012/2012-08-19.json
Downloading 2012-08-20
Writing to 

Writing to data/guardian/2008/2008-08-30.json
Downloading 2008-08-31
Writing to data/guardian/2008/2008-08-31.json
Downloading 2008-09-01
Writing to data/guardian/2008/2008-09-01.json
Downloading 2008-09-02
Writing to data/guardian/2008/2008-09-02.json
Downloading 2008-09-03
Writing to data/guardian/2008/2008-09-03.json
Downloading 2008-09-04
Writing to data/guardian/2008/2008-09-04.json
Downloading 2008-09-05
Writing to data/guardian/2008/2008-09-05.json
Downloading 2008-09-06
Writing to data/guardian/2008/2008-09-06.json
Downloading 2008-09-07
Writing to data/guardian/2008/2008-09-07.json
Downloading 2008-09-08
Writing to data/guardian/2008/2008-09-08.json
Downloading 2008-09-09
Writing to data/guardian/2008/2008-09-09.json
Downloading 2008-09-10
Writing to data/guardian/2008/2008-09-10.json
Downloading 2008-09-11
Writing to data/guardian/2008/2008-09-11.json
Downloading 2008-09-12
Writing to data/guardian/2008/2008-09-12.json
Downloading 2008-09-13
Writing to data/guardian/2008/2008

Writing to data/guardian/2004/2004-09-23.json
Downloading 2004-09-24
Writing to data/guardian/2004/2004-09-24.json
Downloading 2004-09-25
Writing to data/guardian/2004/2004-09-25.json
Downloading 2004-09-26
Writing to data/guardian/2004/2004-09-26.json
Downloading 2004-09-27
Writing to data/guardian/2004/2004-09-27.json
Downloading 2004-09-28
Writing to data/guardian/2004/2004-09-28.json
Downloading 2004-09-29
Writing to data/guardian/2004/2004-09-29.json
Downloading 2004-09-30
Writing to data/guardian/2004/2004-09-30.json
Downloading 2004-10-01
Writing to data/guardian/2004/2004-10-01.json
Downloading 2004-10-02
Writing to data/guardian/2004/2004-10-02.json
Downloading 2004-10-03
Writing to data/guardian/2004/2004-10-03.json
Downloading 2004-10-04
Writing to data/guardian/2004/2004-10-04.json
Downloading 2004-10-05
Writing to data/guardian/2004/2004-10-05.json
Downloading 2004-10-06
Writing to data/guardian/2004/2004-10-06.json
Downloading 2004-10-07
Writing to data/guardian/2004/2004

Writing to data/guardian/2000/2000-10-24.json
Downloading 2000-10-25
Writing to data/guardian/2000/2000-10-25.json
Downloading 2000-10-26
Writing to data/guardian/2000/2000-10-26.json
Downloading 2000-10-27
Writing to data/guardian/2000/2000-10-27.json
Downloading 2000-10-28
Writing to data/guardian/2000/2000-10-28.json
Downloading 2000-10-29
Writing to data/guardian/2000/2000-10-29.json
Downloading 2000-10-30
Writing to data/guardian/2000/2000-10-30.json
Downloading 2000-10-31
Writing to data/guardian/2000/2000-10-31.json
Downloading 2000-11-01
Writing to data/guardian/2000/2000-11-01.json
Downloading 2000-11-02
Writing to data/guardian/2000/2000-11-02.json
Downloading 2000-11-03
Writing to data/guardian/2000/2000-11-03.json
Downloading 2000-11-04
Writing to data/guardian/2000/2000-11-04.json
Downloading 2000-11-05
Writing to data/guardian/2000/2000-11-05.json
Downloading 2000-11-06
Writing to data/guardian/2000/2000-11-06.json
Downloading 2000-11-07
Writing to data/guardian/2000/2000

In [9]:
search_key_health = '(job OR unemployment OR race OR black OR white OR discrimination)' 

get_news_by_date_range(search_key_health, 'headline,body', 'headline,body,sectionName',
                        date(2016, 8, 8), date(2016, 11, 8), 'jobs-race', '2016')

get_news_by_date_range(search_key_health, 'headline,body', 'headline,body,sectionName',
                       date(2012, 8, 6), date(2012, 11, 6), 'jobs-race', '2012')

get_news_by_date_range(search_key_health, 'headline,body', 'headline,body,sectionName',
                       date(2008, 8, 4), date(2008, 11, 4), 'jobs-race', '2008')

get_news_by_date_range(search_key_health, 'headline,body', 'headline,body,sectionName',
                       date(2004, 8, 2), date(2004, 11, 2), 'jobs-race', '2004')

get_news_by_date_range(search_key_health, 'headline,body', 'headline,body,sectionName',
                       date(2000, 8, 7), date(2000, 11, 7), 'jobs-race', '2000')

get_news_by_date_range(search_key_health, 'headline,body', 'headline,body,sectionName',
                       date(2020, 3, 12), date(2020, 6, 12), 'jobs-race', '2020')

Downloading 2016-08-08
Writing to data/guardian/jobs-race/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/jobs-race/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/jobs-race/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/jobs-race/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/jobs-race/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/jobs-race/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/jobs-race/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/jobs-race/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/jobs-race/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/jobs-race/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/jobs-race/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/jobs-race/2016/2016-08-19.json
Downloading 2016-08-20
Writing to data/guardian/jobs

Writing to data/guardian/jobs-race/2012/2012-08-17.json
Downloading 2012-08-18
Writing to data/guardian/jobs-race/2012/2012-08-18.json
Downloading 2012-08-19
Writing to data/guardian/jobs-race/2012/2012-08-19.json
Downloading 2012-08-20
Writing to data/guardian/jobs-race/2012/2012-08-20.json
Downloading 2012-08-21
Writing to data/guardian/jobs-race/2012/2012-08-21.json
Downloading 2012-08-22
Writing to data/guardian/jobs-race/2012/2012-08-22.json
Downloading 2012-08-23
Writing to data/guardian/jobs-race/2012/2012-08-23.json
Downloading 2012-08-24
Writing to data/guardian/jobs-race/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/guardian/jobs-race/2012/2012-08-25.json
Downloading 2012-08-26
Writing to data/guardian/jobs-race/2012/2012-08-26.json
Downloading 2012-08-27
Writing to data/guardian/jobs-race/2012/2012-08-27.json
Downloading 2012-08-28
Writing to data/guardian/jobs-race/2012/2012-08-28.json
Downloading 2012-08-29
Writing to data/guardian/jobs-race/2012/2012-08-29.j

Writing to data/guardian/jobs-race/2008/2008-08-26.json
Downloading 2008-08-27
Writing to data/guardian/jobs-race/2008/2008-08-27.json
Downloading 2008-08-28
Writing to data/guardian/jobs-race/2008/2008-08-28.json
Downloading 2008-08-29
Writing to data/guardian/jobs-race/2008/2008-08-29.json
Downloading 2008-08-30
Writing to data/guardian/jobs-race/2008/2008-08-30.json
Downloading 2008-08-31
Writing to data/guardian/jobs-race/2008/2008-08-31.json
Downloading 2008-09-01
Writing to data/guardian/jobs-race/2008/2008-09-01.json
Downloading 2008-09-02
Writing to data/guardian/jobs-race/2008/2008-09-02.json
Downloading 2008-09-03
Writing to data/guardian/jobs-race/2008/2008-09-03.json
Downloading 2008-09-04
Writing to data/guardian/jobs-race/2008/2008-09-04.json
Downloading 2008-09-05
Writing to data/guardian/jobs-race/2008/2008-09-05.json
Downloading 2008-09-06
Writing to data/guardian/jobs-race/2008/2008-09-06.json
Downloading 2008-09-07
Writing to data/guardian/jobs-race/2008/2008-09-07.j

Writing to data/guardian/jobs-race/2004/2004-09-04.json
Downloading 2004-09-05
Writing to data/guardian/jobs-race/2004/2004-09-05.json
Downloading 2004-09-06
Writing to data/guardian/jobs-race/2004/2004-09-06.json
Downloading 2004-09-07
Writing to data/guardian/jobs-race/2004/2004-09-07.json
Downloading 2004-09-08
Writing to data/guardian/jobs-race/2004/2004-09-08.json
Downloading 2004-09-09
Writing to data/guardian/jobs-race/2004/2004-09-09.json
Downloading 2004-09-10
Writing to data/guardian/jobs-race/2004/2004-09-10.json
Downloading 2004-09-11
Writing to data/guardian/jobs-race/2004/2004-09-11.json
Downloading 2004-09-12
Writing to data/guardian/jobs-race/2004/2004-09-12.json
Downloading 2004-09-13
Writing to data/guardian/jobs-race/2004/2004-09-13.json
Downloading 2004-09-14
Writing to data/guardian/jobs-race/2004/2004-09-14.json
Downloading 2004-09-15
Writing to data/guardian/jobs-race/2004/2004-09-15.json
Downloading 2004-09-16
Writing to data/guardian/jobs-race/2004/2004-09-16.j

Writing to data/guardian/jobs-race/2000/2000-09-20.json
Downloading 2000-09-21
Writing to data/guardian/jobs-race/2000/2000-09-21.json
Downloading 2000-09-22
Writing to data/guardian/jobs-race/2000/2000-09-22.json
Downloading 2000-09-23
Writing to data/guardian/jobs-race/2000/2000-09-23.json
Downloading 2000-09-24
Writing to data/guardian/jobs-race/2000/2000-09-24.json
Downloading 2000-09-25
Writing to data/guardian/jobs-race/2000/2000-09-25.json
Downloading 2000-09-26
Writing to data/guardian/jobs-race/2000/2000-09-26.json
Downloading 2000-09-27
Writing to data/guardian/jobs-race/2000/2000-09-27.json
Downloading 2000-09-28
Writing to data/guardian/jobs-race/2000/2000-09-28.json
Downloading 2000-09-29
Writing to data/guardian/jobs-race/2000/2000-09-29.json
Downloading 2000-09-30
Writing to data/guardian/jobs-race/2000/2000-09-30.json
Downloading 2000-10-01
Writing to data/guardian/jobs-race/2000/2000-10-01.json
Downloading 2000-10-02
Writing to data/guardian/jobs-race/2000/2000-10-02.j

Writing to data/guardian/jobs-race/2020/2020-05-06.json
Downloading 2020-05-07
Writing to data/guardian/jobs-race/2020/2020-05-07.json
Downloading 2020-05-08
Writing to data/guardian/jobs-race/2020/2020-05-08.json
Downloading 2020-05-09
Writing to data/guardian/jobs-race/2020/2020-05-09.json
Downloading 2020-05-10
Writing to data/guardian/jobs-race/2020/2020-05-10.json
Downloading 2020-05-11
Writing to data/guardian/jobs-race/2020/2020-05-11.json
Downloading 2020-05-12
Writing to data/guardian/jobs-race/2020/2020-05-12.json
Downloading 2020-05-13
Writing to data/guardian/jobs-race/2020/2020-05-13.json
Downloading 2020-05-14
Writing to data/guardian/jobs-race/2020/2020-05-14.json
Downloading 2020-05-15
Writing to data/guardian/jobs-race/2020/2020-05-15.json
Downloading 2020-05-16
Writing to data/guardian/jobs-race/2020/2020-05-16.json
Downloading 2020-05-17
Writing to data/guardian/jobs-race/2020/2020-05-17.json
Downloading 2020-05-18
Writing to data/guardian/jobs-race/2020/2020-05-18.j

In [3]:
search_key_environemnt = '(global OR warming OR (green AND deal) OR environment OR (coal AND job) OR (fossil AND fuel))' 

get_news_by_date_range(search_key_environemnt, 'headline,body', 'headline,body,sectionName',
                        date(2016, 8, 8), date(2016, 11, 8), 'environment', '2016')

get_news_by_date_range(search_key_environemnt, 'headline,body', 'headline,body,sectionName',
                       date(2012, 8, 6), date(2012, 11, 6), 'environment', '2012')

get_news_by_date_range(search_key_environemnt, 'headline,body', 'headline,body,sectionName',
                       date(2008, 8, 4), date(2008, 11, 4), 'environment', '2008')

get_news_by_date_range(search_key_environemnt, 'headline,body', 'headline,body,sectionName',
                       date(2004, 8, 2), date(2004, 11, 2), 'environment', '2004')

get_news_by_date_range(search_key_environemnt, 'headline,body', 'headline,body,sectionName',
                       date(2000, 8, 7), date(2000, 11, 7), 'environment', '2000')

get_news_by_date_range(search_key_environemnt, 'headline,body', 'headline,body,sectionName',
                       date(2020, 3, 12), date(2020, 6, 12), 'environment', '2020')

Downloading 2016-08-08
Writing to data/guardian/environment/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/environment/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/environment/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/environment/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/environment/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/environment/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/environment/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/environment/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/environment/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/environment/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/environment/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/environment/2016/2016-08-19.json
Downloading 2016-08-20
Writi

Writing to data/guardian/environment/2012/2012-08-14.json
Downloading 2012-08-15
Writing to data/guardian/environment/2012/2012-08-15.json
Downloading 2012-08-16
Writing to data/guardian/environment/2012/2012-08-16.json
Downloading 2012-08-17
Writing to data/guardian/environment/2012/2012-08-17.json
Downloading 2012-08-18
Writing to data/guardian/environment/2012/2012-08-18.json
Downloading 2012-08-19
Writing to data/guardian/environment/2012/2012-08-19.json
Downloading 2012-08-20
Writing to data/guardian/environment/2012/2012-08-20.json
Downloading 2012-08-21
Writing to data/guardian/environment/2012/2012-08-21.json
Downloading 2012-08-22
Writing to data/guardian/environment/2012/2012-08-22.json
Downloading 2012-08-23
Writing to data/guardian/environment/2012/2012-08-23.json
Downloading 2012-08-24
Writing to data/guardian/environment/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/guardian/environment/2012/2012-08-25.json
Downloading 2012-08-26
Writing to data/guardian/env

Writing to data/guardian/environment/2008/2008-08-21.json
Downloading 2008-08-22
Writing to data/guardian/environment/2008/2008-08-22.json
Downloading 2008-08-23
Writing to data/guardian/environment/2008/2008-08-23.json
Downloading 2008-08-24
Writing to data/guardian/environment/2008/2008-08-24.json
Downloading 2008-08-25
Writing to data/guardian/environment/2008/2008-08-25.json
Downloading 2008-08-26
Writing to data/guardian/environment/2008/2008-08-26.json
Downloading 2008-08-27
Writing to data/guardian/environment/2008/2008-08-27.json
Downloading 2008-08-28
Writing to data/guardian/environment/2008/2008-08-28.json
Downloading 2008-08-29
Writing to data/guardian/environment/2008/2008-08-29.json
Downloading 2008-08-30
Writing to data/guardian/environment/2008/2008-08-30.json
Downloading 2008-08-31
Writing to data/guardian/environment/2008/2008-08-31.json
Downloading 2008-09-01
Writing to data/guardian/environment/2008/2008-09-01.json
Downloading 2008-09-02
Writing to data/guardian/env

Writing to data/guardian/environment/2004/2004-08-28.json
Downloading 2004-08-29
Writing to data/guardian/environment/2004/2004-08-29.json
Downloading 2004-08-30
Writing to data/guardian/environment/2004/2004-08-30.json
Downloading 2004-08-31
Writing to data/guardian/environment/2004/2004-08-31.json
Downloading 2004-09-01
Writing to data/guardian/environment/2004/2004-09-01.json
Downloading 2004-09-02
Writing to data/guardian/environment/2004/2004-09-02.json
Downloading 2004-09-03
Writing to data/guardian/environment/2004/2004-09-03.json
Downloading 2004-09-04
Writing to data/guardian/environment/2004/2004-09-04.json
Downloading 2004-09-05
Writing to data/guardian/environment/2004/2004-09-05.json
Downloading 2004-09-06
Writing to data/guardian/environment/2004/2004-09-06.json
Downloading 2004-09-07
Writing to data/guardian/environment/2004/2004-09-07.json
Downloading 2004-09-08
Writing to data/guardian/environment/2004/2004-09-08.json
Downloading 2004-09-09
Writing to data/guardian/env

Writing to data/guardian/environment/2000/2000-09-11.json
Downloading 2000-09-12
Writing to data/guardian/environment/2000/2000-09-12.json
Downloading 2000-09-13
Writing to data/guardian/environment/2000/2000-09-13.json
Downloading 2000-09-14
Writing to data/guardian/environment/2000/2000-09-14.json
Downloading 2000-09-15
Writing to data/guardian/environment/2000/2000-09-15.json
Downloading 2000-09-16
Writing to data/guardian/environment/2000/2000-09-16.json
Downloading 2000-09-17
Writing to data/guardian/environment/2000/2000-09-17.json
Downloading 2000-09-18
Writing to data/guardian/environment/2000/2000-09-18.json
Downloading 2000-09-19
Writing to data/guardian/environment/2000/2000-09-19.json
Downloading 2000-09-20
Writing to data/guardian/environment/2000/2000-09-20.json
Downloading 2000-09-21
Writing to data/guardian/environment/2000/2000-09-21.json
Downloading 2000-09-22
Writing to data/guardian/environment/2000/2000-09-22.json
Downloading 2000-09-23
Writing to data/guardian/env

Writing to data/guardian/environment/2020/2020-04-25.json
Downloading 2020-04-26
Writing to data/guardian/environment/2020/2020-04-26.json
Downloading 2020-04-27
Writing to data/guardian/environment/2020/2020-04-27.json
Downloading 2020-04-28
Writing to data/guardian/environment/2020/2020-04-28.json
Downloading 2020-04-29
Writing to data/guardian/environment/2020/2020-04-29.json
Downloading 2020-04-30
Writing to data/guardian/environment/2020/2020-04-30.json
Downloading 2020-05-01
Writing to data/guardian/environment/2020/2020-05-01.json
Downloading 2020-05-02
Writing to data/guardian/environment/2020/2020-05-02.json
Downloading 2020-05-03
Writing to data/guardian/environment/2020/2020-05-03.json
Downloading 2020-05-04
Writing to data/guardian/environment/2020/2020-05-04.json
Downloading 2020-05-05
Writing to data/guardian/environment/2020/2020-05-05.json
Downloading 2020-05-06
Writing to data/guardian/environment/2020/2020-05-06.json
Downloading 2020-05-07
Writing to data/guardian/env

In [5]:
def download_guardian_data(search_key, subdir):
    get_news_by_date_range(search_key, 'headline,body', 'headline,body,sectionName',
                            date(2016, 8, 8), date(2016, 11, 8), subdir, '2016')

    get_news_by_date_range(search_key, 'headline,body', 'headline,body,sectionName',
                           date(2012, 8, 6), date(2012, 11, 6), subdir, '2012')

    get_news_by_date_range(search_key, 'headline,body', 'headline,body,sectionName',
                           date(2008, 8, 4), date(2008, 11, 4), subdir, '2008')

    get_news_by_date_range(search_key, 'headline,body', 'headline,body,sectionName',
                           date(2004, 8, 2), date(2004, 11, 2), subdir, '2004')

    get_news_by_date_range(search_key, 'headline,body', 'headline,body,sectionName',
                           date(2000, 8, 7), date(2000, 11, 7), subdir, '2000')

    get_news_by_date_range(search_key, 'headline,body', 'headline,body,sectionName',
                           date(2020, 3, 12), date(2020, 6, 12), subdir, '2020')

Downloading 2016-08-08
Writing to data/guardian/guns/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/guns/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/guns/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/guns/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/guns/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/guns/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/guns/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/guns/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/guns/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/guns/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/guns/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/guns/2016/2016-08-19.json
Downloading 2016-08-20
Writing to data/guardian/guns/2016/2016-08-20.json
Downloading 2016-08-21
Writing to data

Writing to data/guardian/guns/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/guardian/guns/2012/2012-08-25.json
Downloading 2012-08-26
Writing to data/guardian/guns/2012/2012-08-26.json
Downloading 2012-08-27
Writing to data/guardian/guns/2012/2012-08-27.json
Downloading 2012-08-28
Writing to data/guardian/guns/2012/2012-08-28.json
Downloading 2012-08-29
Writing to data/guardian/guns/2012/2012-08-29.json
Downloading 2012-08-30
Writing to data/guardian/guns/2012/2012-08-30.json
Downloading 2012-08-31
Writing to data/guardian/guns/2012/2012-08-31.json
Downloading 2012-09-01
Writing to data/guardian/guns/2012/2012-09-01.json
Downloading 2012-09-02
Writing to data/guardian/guns/2012/2012-09-02.json
Downloading 2012-09-03
Writing to data/guardian/guns/2012/2012-09-03.json
Downloading 2012-09-04
Writing to data/guardian/guns/2012/2012-09-04.json
Downloading 2012-09-05
Writing to data/guardian/guns/2012/2012-09-05.json
Downloading 2012-09-06
Writing to data/guardian/guns/2012/201

Writing to data/guardian/guns/2008/2008-09-09.json
Downloading 2008-09-10
Writing to data/guardian/guns/2008/2008-09-10.json
Downloading 2008-09-11
Writing to data/guardian/guns/2008/2008-09-11.json
Downloading 2008-09-12
Writing to data/guardian/guns/2008/2008-09-12.json
Downloading 2008-09-13
Writing to data/guardian/guns/2008/2008-09-13.json
Downloading 2008-09-14
Writing to data/guardian/guns/2008/2008-09-14.json
Downloading 2008-09-15
Writing to data/guardian/guns/2008/2008-09-15.json
Downloading 2008-09-16
Writing to data/guardian/guns/2008/2008-09-16.json
Downloading 2008-09-17
Writing to data/guardian/guns/2008/2008-09-17.json
Downloading 2008-09-18
Writing to data/guardian/guns/2008/2008-09-18.json
Downloading 2008-09-19
Writing to data/guardian/guns/2008/2008-09-19.json
Downloading 2008-09-20
Writing to data/guardian/guns/2008/2008-09-20.json
Downloading 2008-09-21
Writing to data/guardian/guns/2008/2008-09-21.json
Downloading 2008-09-22
Writing to data/guardian/guns/2008/200

Writing to data/guardian/guns/2004/2004-09-25.json
Downloading 2004-09-26
Writing to data/guardian/guns/2004/2004-09-26.json
Downloading 2004-09-27
Writing to data/guardian/guns/2004/2004-09-27.json
Downloading 2004-09-28
Writing to data/guardian/guns/2004/2004-09-28.json
Downloading 2004-09-29
Writing to data/guardian/guns/2004/2004-09-29.json
Downloading 2004-09-30
Writing to data/guardian/guns/2004/2004-09-30.json
Downloading 2004-10-01
Writing to data/guardian/guns/2004/2004-10-01.json
Downloading 2004-10-02
Writing to data/guardian/guns/2004/2004-10-02.json
Downloading 2004-10-03
Writing to data/guardian/guns/2004/2004-10-03.json
Downloading 2004-10-04
Writing to data/guardian/guns/2004/2004-10-04.json
Downloading 2004-10-05
Writing to data/guardian/guns/2004/2004-10-05.json
Downloading 2004-10-06
Writing to data/guardian/guns/2004/2004-10-06.json
Downloading 2004-10-07
Writing to data/guardian/guns/2004/2004-10-07.json
Downloading 2004-10-08
Writing to data/guardian/guns/2004/200

Writing to data/guardian/guns/2000/2000-10-18.json
Downloading 2000-10-19
Writing to data/guardian/guns/2000/2000-10-19.json
Downloading 2000-10-20
Writing to data/guardian/guns/2000/2000-10-20.json
Downloading 2000-10-21
Writing to data/guardian/guns/2000/2000-10-21.json
Downloading 2000-10-22
Writing to data/guardian/guns/2000/2000-10-22.json
Downloading 2000-10-23
Writing to data/guardian/guns/2000/2000-10-23.json
Downloading 2000-10-24
Writing to data/guardian/guns/2000/2000-10-24.json
Downloading 2000-10-25
Writing to data/guardian/guns/2000/2000-10-25.json
Downloading 2000-10-26
Writing to data/guardian/guns/2000/2000-10-26.json
Downloading 2000-10-27
Writing to data/guardian/guns/2000/2000-10-27.json
Downloading 2000-10-28
Writing to data/guardian/guns/2000/2000-10-28.json
Downloading 2000-10-29
Writing to data/guardian/guns/2000/2000-10-29.json
Downloading 2000-10-30
Writing to data/guardian/guns/2000/2000-10-30.json
Downloading 2000-10-31
Writing to data/guardian/guns/2000/200

Writing to data/guardian/guns/2020/2020-06-10.json
Downloading 2020-06-11
Writing to data/guardian/guns/2020/2020-06-11.json
Downloading 2020-06-12
Writing to data/guardian/guns/2020/2020-06-12.json


In [11]:
search_key_foreign_policy = '(terrorism OR (defence AND budget) OR iran OR iraq OR afganisthan OR troops OR syria OR libya OR (north AND korea) OR china OR russia OR nato OR mexico OR canada)' 
download_guardian_data(search_key_environment, 'foreign-policy')

Downloading 2016-08-08
Writing to data/guardian/foreign-policy/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/foreign-policy/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/foreign-policy/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/foreign-policy/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/foreign-policy/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/foreign-policy/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/foreign-policy/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/foreign-policy/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/foreign-policy/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/foreign-policy/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/foreign-policy/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/foreign-policy/2016/2016-08-

Writing to data/guardian/foreign-policy/2012/2012-08-11.json
Downloading 2012-08-12
Writing to data/guardian/foreign-policy/2012/2012-08-12.json
Downloading 2012-08-13
Writing to data/guardian/foreign-policy/2012/2012-08-13.json
Downloading 2012-08-14
Writing to data/guardian/foreign-policy/2012/2012-08-14.json
Downloading 2012-08-15
Writing to data/guardian/foreign-policy/2012/2012-08-15.json
Downloading 2012-08-16
Writing to data/guardian/foreign-policy/2012/2012-08-16.json
Downloading 2012-08-17
Writing to data/guardian/foreign-policy/2012/2012-08-17.json
Downloading 2012-08-18
Writing to data/guardian/foreign-policy/2012/2012-08-18.json
Downloading 2012-08-19
Writing to data/guardian/foreign-policy/2012/2012-08-19.json
Downloading 2012-08-20
Writing to data/guardian/foreign-policy/2012/2012-08-20.json
Downloading 2012-08-21
Writing to data/guardian/foreign-policy/2012/2012-08-21.json
Downloading 2012-08-22
Writing to data/guardian/foreign-policy/2012/2012-08-22.json
Downloading 201

Writing to data/guardian/foreign-policy/2008/2008-08-14.json
Downloading 2008-08-15
Writing to data/guardian/foreign-policy/2008/2008-08-15.json
Downloading 2008-08-16
Writing to data/guardian/foreign-policy/2008/2008-08-16.json
Downloading 2008-08-17
Writing to data/guardian/foreign-policy/2008/2008-08-17.json
Downloading 2008-08-18
Writing to data/guardian/foreign-policy/2008/2008-08-18.json
Downloading 2008-08-19
Writing to data/guardian/foreign-policy/2008/2008-08-19.json
Downloading 2008-08-20
Writing to data/guardian/foreign-policy/2008/2008-08-20.json
Downloading 2008-08-21
Writing to data/guardian/foreign-policy/2008/2008-08-21.json
Downloading 2008-08-22
Writing to data/guardian/foreign-policy/2008/2008-08-22.json
Downloading 2008-08-23
Writing to data/guardian/foreign-policy/2008/2008-08-23.json
Downloading 2008-08-24
Writing to data/guardian/foreign-policy/2008/2008-08-24.json
Downloading 2008-08-25
Writing to data/guardian/foreign-policy/2008/2008-08-25.json
Downloading 200

Writing to data/guardian/foreign-policy/2004/2004-08-17.json
Downloading 2004-08-18
Writing to data/guardian/foreign-policy/2004/2004-08-18.json
Downloading 2004-08-19
Writing to data/guardian/foreign-policy/2004/2004-08-19.json
Downloading 2004-08-20
Writing to data/guardian/foreign-policy/2004/2004-08-20.json
Downloading 2004-08-21
Writing to data/guardian/foreign-policy/2004/2004-08-21.json
Downloading 2004-08-22
Writing to data/guardian/foreign-policy/2004/2004-08-22.json
Downloading 2004-08-23
Writing to data/guardian/foreign-policy/2004/2004-08-23.json
Downloading 2004-08-24
Writing to data/guardian/foreign-policy/2004/2004-08-24.json
Downloading 2004-08-25
Writing to data/guardian/foreign-policy/2004/2004-08-25.json
Downloading 2004-08-26
Writing to data/guardian/foreign-policy/2004/2004-08-26.json
Downloading 2004-08-27
Writing to data/guardian/foreign-policy/2004/2004-08-27.json
Downloading 2004-08-28
Writing to data/guardian/foreign-policy/2004/2004-08-28.json
Downloading 200

Writing to data/guardian/foreign-policy/2000/2000-08-27.json
Downloading 2000-08-28
Writing to data/guardian/foreign-policy/2000/2000-08-28.json
Downloading 2000-08-29
Writing to data/guardian/foreign-policy/2000/2000-08-29.json
Downloading 2000-08-30
Writing to data/guardian/foreign-policy/2000/2000-08-30.json
Downloading 2000-08-31
Writing to data/guardian/foreign-policy/2000/2000-08-31.json
Downloading 2000-09-01
Writing to data/guardian/foreign-policy/2000/2000-09-01.json
Downloading 2000-09-02
Writing to data/guardian/foreign-policy/2000/2000-09-02.json
Downloading 2000-09-03
Writing to data/guardian/foreign-policy/2000/2000-09-03.json
Downloading 2000-09-04
Writing to data/guardian/foreign-policy/2000/2000-09-04.json
Downloading 2000-09-05
Writing to data/guardian/foreign-policy/2000/2000-09-05.json
Downloading 2000-09-06
Writing to data/guardian/foreign-policy/2000/2000-09-06.json
Downloading 2000-09-07
Writing to data/guardian/foreign-policy/2000/2000-09-07.json
Downloading 200

Writing to data/guardian/foreign-policy/2020/2020-04-06.json
Downloading 2020-04-07
Writing to data/guardian/foreign-policy/2020/2020-04-07.json
Downloading 2020-04-08
Writing to data/guardian/foreign-policy/2020/2020-04-08.json
Downloading 2020-04-09
Writing to data/guardian/foreign-policy/2020/2020-04-09.json
Downloading 2020-04-10
Writing to data/guardian/foreign-policy/2020/2020-04-10.json
Downloading 2020-04-11
Writing to data/guardian/foreign-policy/2020/2020-04-11.json
Downloading 2020-04-12
Writing to data/guardian/foreign-policy/2020/2020-04-12.json
Downloading 2020-04-13
Writing to data/guardian/foreign-policy/2020/2020-04-13.json
Downloading 2020-04-14
Writing to data/guardian/foreign-policy/2020/2020-04-14.json
Downloading 2020-04-15
Writing to data/guardian/foreign-policy/2020/2020-04-15.json
Downloading 2020-04-16
Writing to data/guardian/foreign-policy/2020/2020-04-16.json
Downloading 2020-04-17
Writing to data/guardian/foreign-policy/2020/2020-04-17.json
Downloading 202

In [13]:
search_key_environment = '(gun OR control OR law OR legislation OR background OR check OR shooting OR (semi AND automatic))' 
download_guardian_data(search_key_environment, 'guns')

Downloading 2016-08-08
Writing to data/guardian/guns/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/guns/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/guns/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/guns/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/guns/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/guns/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/guns/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/guns/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/guns/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/guns/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/guns/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/guns/2016/2016-08-19.json
Downloading 2016-08-20
Writing to data/guardian/guns/2016/2016-08-20.json
Downloading 2016-08-21
Writing to data

Writing to data/guardian/guns/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/guardian/guns/2012/2012-08-25.json
Downloading 2012-08-26
Writing to data/guardian/guns/2012/2012-08-26.json
Downloading 2012-08-27
Writing to data/guardian/guns/2012/2012-08-27.json
Downloading 2012-08-28
Writing to data/guardian/guns/2012/2012-08-28.json
Downloading 2012-08-29
Writing to data/guardian/guns/2012/2012-08-29.json
Downloading 2012-08-30
Writing to data/guardian/guns/2012/2012-08-30.json
Downloading 2012-08-31
Writing to data/guardian/guns/2012/2012-08-31.json
Downloading 2012-09-01
Writing to data/guardian/guns/2012/2012-09-01.json
Downloading 2012-09-02
Writing to data/guardian/guns/2012/2012-09-02.json
Downloading 2012-09-03
Writing to data/guardian/guns/2012/2012-09-03.json
Downloading 2012-09-04
Writing to data/guardian/guns/2012/2012-09-04.json
Downloading 2012-09-05
Writing to data/guardian/guns/2012/2012-09-05.json
Downloading 2012-09-06
Writing to data/guardian/guns/2012/201

Writing to data/guardian/guns/2008/2008-09-09.json
Downloading 2008-09-10
Writing to data/guardian/guns/2008/2008-09-10.json
Downloading 2008-09-11
Writing to data/guardian/guns/2008/2008-09-11.json
Downloading 2008-09-12
Writing to data/guardian/guns/2008/2008-09-12.json
Downloading 2008-09-13
Writing to data/guardian/guns/2008/2008-09-13.json
Downloading 2008-09-14
Writing to data/guardian/guns/2008/2008-09-14.json
Downloading 2008-09-15
Writing to data/guardian/guns/2008/2008-09-15.json
Downloading 2008-09-16
Writing to data/guardian/guns/2008/2008-09-16.json
Downloading 2008-09-17
Writing to data/guardian/guns/2008/2008-09-17.json
Downloading 2008-09-18
Writing to data/guardian/guns/2008/2008-09-18.json
Downloading 2008-09-19
Writing to data/guardian/guns/2008/2008-09-19.json
Downloading 2008-09-20
Writing to data/guardian/guns/2008/2008-09-20.json
Downloading 2008-09-21
Writing to data/guardian/guns/2008/2008-09-21.json
Downloading 2008-09-22
Writing to data/guardian/guns/2008/200

Writing to data/guardian/guns/2004/2004-09-25.json
Downloading 2004-09-26
Writing to data/guardian/guns/2004/2004-09-26.json
Downloading 2004-09-27
Writing to data/guardian/guns/2004/2004-09-27.json
Downloading 2004-09-28
Writing to data/guardian/guns/2004/2004-09-28.json
Downloading 2004-09-29
Writing to data/guardian/guns/2004/2004-09-29.json
Downloading 2004-09-30
Writing to data/guardian/guns/2004/2004-09-30.json
Downloading 2004-10-01
Writing to data/guardian/guns/2004/2004-10-01.json
Downloading 2004-10-02
Writing to data/guardian/guns/2004/2004-10-02.json
Downloading 2004-10-03
Writing to data/guardian/guns/2004/2004-10-03.json
Downloading 2004-10-04
Writing to data/guardian/guns/2004/2004-10-04.json
Downloading 2004-10-05
Writing to data/guardian/guns/2004/2004-10-05.json
Downloading 2004-10-06
Writing to data/guardian/guns/2004/2004-10-06.json
Downloading 2004-10-07
Writing to data/guardian/guns/2004/2004-10-07.json
Downloading 2004-10-08
Writing to data/guardian/guns/2004/200

Writing to data/guardian/guns/2000/2000-10-18.json
Downloading 2000-10-19
Writing to data/guardian/guns/2000/2000-10-19.json
Downloading 2000-10-20
Writing to data/guardian/guns/2000/2000-10-20.json
Downloading 2000-10-21
Writing to data/guardian/guns/2000/2000-10-21.json
Downloading 2000-10-22
Writing to data/guardian/guns/2000/2000-10-22.json
Downloading 2000-10-23
Writing to data/guardian/guns/2000/2000-10-23.json
Downloading 2000-10-24
Writing to data/guardian/guns/2000/2000-10-24.json
Downloading 2000-10-25
Writing to data/guardian/guns/2000/2000-10-25.json
Downloading 2000-10-26
Writing to data/guardian/guns/2000/2000-10-26.json
Downloading 2000-10-27
Writing to data/guardian/guns/2000/2000-10-27.json
Downloading 2000-10-28
Writing to data/guardian/guns/2000/2000-10-28.json
Downloading 2000-10-29
Writing to data/guardian/guns/2000/2000-10-29.json
Downloading 2000-10-30
Writing to data/guardian/guns/2000/2000-10-30.json
Downloading 2000-10-31
Writing to data/guardian/guns/2000/200

Writing to data/guardian/guns/2020/2020-06-10.json
Downloading 2020-06-11
Writing to data/guardian/guns/2020/2020-06-11.json
Downloading 2020-06-12
Writing to data/guardian/guns/2020/2020-06-12.json


In [14]:
search_key_health = 'healthcare OR insurance OR coverage OR prescription OR preexisting OR medicare OR pocket OR cost OR aca OR affordable OR medicaid' 
download_guardian_data(search_key_health, 'health1')

Downloading 2016-08-08
Writing to data/guardian/health1/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/health1/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/health1/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/health1/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/health1/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/health1/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/health1/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/health1/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/health1/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/health1/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/health1/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/health1/2016/2016-08-19.json
Downloading 2016-08-20
Writing to data/guardian/health1/2016/2016-08-20.json

Writing to data/guardian/health1/2012/2012-08-20.json
Downloading 2012-08-21
Writing to data/guardian/health1/2012/2012-08-21.json
Downloading 2012-08-22
Writing to data/guardian/health1/2012/2012-08-22.json
Downloading 2012-08-23
Writing to data/guardian/health1/2012/2012-08-23.json
Downloading 2012-08-24
Writing to data/guardian/health1/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/guardian/health1/2012/2012-08-25.json
Downloading 2012-08-26
Writing to data/guardian/health1/2012/2012-08-26.json
Downloading 2012-08-27
Writing to data/guardian/health1/2012/2012-08-27.json
Downloading 2012-08-28
Writing to data/guardian/health1/2012/2012-08-28.json
Downloading 2012-08-29
Writing to data/guardian/health1/2012/2012-08-29.json
Downloading 2012-08-30
Writing to data/guardian/health1/2012/2012-08-30.json
Downloading 2012-08-31
Writing to data/guardian/health1/2012/2012-08-31.json
Downloading 2012-09-01
Writing to data/guardian/health1/2012/2012-09-01.json
Downloading 2012-09-02

Writing to data/guardian/health1/2008/2008-09-01.json
Downloading 2008-09-02
Writing to data/guardian/health1/2008/2008-09-02.json
Downloading 2008-09-03
Writing to data/guardian/health1/2008/2008-09-03.json
Downloading 2008-09-04
Writing to data/guardian/health1/2008/2008-09-04.json
Downloading 2008-09-05
Writing to data/guardian/health1/2008/2008-09-05.json
Downloading 2008-09-06
Writing to data/guardian/health1/2008/2008-09-06.json
Downloading 2008-09-07
Writing to data/guardian/health1/2008/2008-09-07.json
Downloading 2008-09-08
Writing to data/guardian/health1/2008/2008-09-08.json
Downloading 2008-09-09
Writing to data/guardian/health1/2008/2008-09-09.json
Downloading 2008-09-10
Writing to data/guardian/health1/2008/2008-09-10.json
Downloading 2008-09-11
Writing to data/guardian/health1/2008/2008-09-11.json
Downloading 2008-09-12
Writing to data/guardian/health1/2008/2008-09-12.json
Downloading 2008-09-13
Writing to data/guardian/health1/2008/2008-09-13.json
Downloading 2008-09-14

ConnectionError: HTTPConnectionPool(host='content.guardianapis.com', port=80): Max retries exceeded with url: /search?from-date=2004-08-24&to-date=2004-08-24&order-by=newest&edition=US&show-fields=headline%2Cbody%2CsectionName&q=healthcare+OR+insurance+OR+coverage+OR+prescription+OR+preexisting+OR+medicare+OR+pocket+OR+cost+OR+aca+OR+affordable+OR+medicaid&query-fields=headline%2Cbody&sectionName=politics&page-size=200&api-key=73b806db-dd72-4f01-a965-9179f7b71c6f&page=1 (Caused by NewConnectionError('<urllib3.connection.HTTPConnection object at 0x7f304e7c1048>: Failed to establish a new connection: [Errno 113] No route to host'))

In [15]:
search_key_imm = 'immigration OR undocumented OR mexico OR asylum OR (south AND border) OR deport OR ICE OR USCIS OR refugee OR migrant OR visa OR (green AND card)'
download_guardian_data(search_key_imm, 'immigration1')

Downloading 2016-08-08
Writing to data/guardian/immigration1/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/immigration1/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/immigration1/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/immigration1/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/immigration1/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/immigration1/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/immigration1/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/immigration1/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/immigration1/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/immigration1/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/immigration1/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/immigration1/2016/2016-08-19.json
Downloading 2016

Writing to data/guardian/immigration1/2012/2012-08-13.json
Downloading 2012-08-14
Writing to data/guardian/immigration1/2012/2012-08-14.json
Downloading 2012-08-15
Writing to data/guardian/immigration1/2012/2012-08-15.json
Downloading 2012-08-16
Writing to data/guardian/immigration1/2012/2012-08-16.json
Downloading 2012-08-17
Writing to data/guardian/immigration1/2012/2012-08-17.json
Downloading 2012-08-18
Writing to data/guardian/immigration1/2012/2012-08-18.json
Downloading 2012-08-19
Writing to data/guardian/immigration1/2012/2012-08-19.json
Downloading 2012-08-20
Writing to data/guardian/immigration1/2012/2012-08-20.json
Downloading 2012-08-21
Writing to data/guardian/immigration1/2012/2012-08-21.json
Downloading 2012-08-22
Writing to data/guardian/immigration1/2012/2012-08-22.json
Downloading 2012-08-23
Writing to data/guardian/immigration1/2012/2012-08-23.json
Downloading 2012-08-24
Writing to data/guardian/immigration1/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/

Writing to data/guardian/immigration1/2008/2008-08-18.json
Downloading 2008-08-19
Writing to data/guardian/immigration1/2008/2008-08-19.json
Downloading 2008-08-20
Writing to data/guardian/immigration1/2008/2008-08-20.json
Downloading 2008-08-21
Writing to data/guardian/immigration1/2008/2008-08-21.json
Downloading 2008-08-22
Writing to data/guardian/immigration1/2008/2008-08-22.json
Downloading 2008-08-23
Writing to data/guardian/immigration1/2008/2008-08-23.json
Downloading 2008-08-24
Writing to data/guardian/immigration1/2008/2008-08-24.json
Downloading 2008-08-25
Writing to data/guardian/immigration1/2008/2008-08-25.json
Downloading 2008-08-26
Writing to data/guardian/immigration1/2008/2008-08-26.json
Downloading 2008-08-27
Writing to data/guardian/immigration1/2008/2008-08-27.json
Downloading 2008-08-28
Writing to data/guardian/immigration1/2008/2008-08-28.json
Downloading 2008-08-29
Writing to data/guardian/immigration1/2008/2008-08-29.json
Downloading 2008-08-30
Writing to data/

Writing to data/guardian/immigration1/2004/2004-08-23.json
Downloading 2004-08-24
Writing to data/guardian/immigration1/2004/2004-08-24.json
Downloading 2004-08-25
Writing to data/guardian/immigration1/2004/2004-08-25.json
Downloading 2004-08-26
Writing to data/guardian/immigration1/2004/2004-08-26.json
Downloading 2004-08-27
Writing to data/guardian/immigration1/2004/2004-08-27.json
Downloading 2004-08-28
Writing to data/guardian/immigration1/2004/2004-08-28.json
Downloading 2004-08-29
Writing to data/guardian/immigration1/2004/2004-08-29.json
Downloading 2004-08-30
Writing to data/guardian/immigration1/2004/2004-08-30.json
Downloading 2004-08-31
Writing to data/guardian/immigration1/2004/2004-08-31.json
Downloading 2004-09-01
Writing to data/guardian/immigration1/2004/2004-09-01.json
Downloading 2004-09-02
Writing to data/guardian/immigration1/2004/2004-09-02.json
Downloading 2004-09-03
Writing to data/guardian/immigration1/2004/2004-09-03.json
Downloading 2004-09-04
Writing to data/

Writing to data/guardian/immigration1/2000/2000-09-04.json
Downloading 2000-09-05
Writing to data/guardian/immigration1/2000/2000-09-05.json
Downloading 2000-09-06
Writing to data/guardian/immigration1/2000/2000-09-06.json
Downloading 2000-09-07
Writing to data/guardian/immigration1/2000/2000-09-07.json
Downloading 2000-09-08
Writing to data/guardian/immigration1/2000/2000-09-08.json
Downloading 2000-09-09
Writing to data/guardian/immigration1/2000/2000-09-09.json
Downloading 2000-09-10
Writing to data/guardian/immigration1/2000/2000-09-10.json
Downloading 2000-09-11
Writing to data/guardian/immigration1/2000/2000-09-11.json
Downloading 2000-09-12
Writing to data/guardian/immigration1/2000/2000-09-12.json
Downloading 2000-09-13
Writing to data/guardian/immigration1/2000/2000-09-13.json
Downloading 2000-09-14
Writing to data/guardian/immigration1/2000/2000-09-14.json
Downloading 2000-09-15
Writing to data/guardian/immigration1/2000/2000-09-15.json
Downloading 2000-09-16
Writing to data/

Writing to data/guardian/immigration1/2020/2020-04-16.json
Downloading 2020-04-17
Writing to data/guardian/immigration1/2020/2020-04-17.json
Downloading 2020-04-18
Writing to data/guardian/immigration1/2020/2020-04-18.json
Downloading 2020-04-19
Writing to data/guardian/immigration1/2020/2020-04-19.json
Downloading 2020-04-20
Writing to data/guardian/immigration1/2020/2020-04-20.json
Downloading 2020-04-21
Writing to data/guardian/immigration1/2020/2020-04-21.json
Downloading 2020-04-22
Writing to data/guardian/immigration1/2020/2020-04-22.json
Downloading 2020-04-23
Writing to data/guardian/immigration1/2020/2020-04-23.json
Downloading 2020-04-24
Writing to data/guardian/immigration1/2020/2020-04-24.json
Downloading 2020-04-25
Writing to data/guardian/immigration1/2020/2020-04-25.json
Downloading 2020-04-26
Writing to data/guardian/immigration1/2020/2020-04-26.json
Downloading 2020-04-27
Writing to data/guardian/immigration1/2020/2020-04-27.json
Downloading 2020-04-28
Writing to data/

In [16]:
search_key_party = 'democrat OR republican OR senate OR house OR campaign OR (super AND pac) OR rallies OR protests' 
download_guardian_data(search_key_environment, 'party1')


Downloading 2016-08-08
Writing to data/guardian/party1/2016/2016-08-08.json
Downloading 2016-08-09
Writing to data/guardian/party1/2016/2016-08-09.json
Downloading 2016-08-10
Writing to data/guardian/party1/2016/2016-08-10.json
Downloading 2016-08-11
Writing to data/guardian/party1/2016/2016-08-11.json
Downloading 2016-08-12
Writing to data/guardian/party1/2016/2016-08-12.json
Downloading 2016-08-13
Writing to data/guardian/party1/2016/2016-08-13.json
Downloading 2016-08-14
Writing to data/guardian/party1/2016/2016-08-14.json
Downloading 2016-08-15
Writing to data/guardian/party1/2016/2016-08-15.json
Downloading 2016-08-16
Writing to data/guardian/party1/2016/2016-08-16.json
Downloading 2016-08-17
Writing to data/guardian/party1/2016/2016-08-17.json
Downloading 2016-08-18
Writing to data/guardian/party1/2016/2016-08-18.json
Downloading 2016-08-19
Writing to data/guardian/party1/2016/2016-08-19.json
Downloading 2016-08-20
Writing to data/guardian/party1/2016/2016-08-20.json
Downloading 

Writing to data/guardian/party1/2012/2012-08-21.json
Downloading 2012-08-22
Writing to data/guardian/party1/2012/2012-08-22.json
Downloading 2012-08-23
Writing to data/guardian/party1/2012/2012-08-23.json
Downloading 2012-08-24
Writing to data/guardian/party1/2012/2012-08-24.json
Downloading 2012-08-25
Writing to data/guardian/party1/2012/2012-08-25.json
Downloading 2012-08-26
Writing to data/guardian/party1/2012/2012-08-26.json
Downloading 2012-08-27
Writing to data/guardian/party1/2012/2012-08-27.json
Downloading 2012-08-28
Writing to data/guardian/party1/2012/2012-08-28.json
Downloading 2012-08-29
Writing to data/guardian/party1/2012/2012-08-29.json
Downloading 2012-08-30
Writing to data/guardian/party1/2012/2012-08-30.json
Downloading 2012-08-31
Writing to data/guardian/party1/2012/2012-08-31.json
Downloading 2012-09-01
Writing to data/guardian/party1/2012/2012-09-01.json
Downloading 2012-09-02
Writing to data/guardian/party1/2012/2012-09-02.json
Downloading 2012-09-03
Writing to d

KeyboardInterrupt: 

In [None]:
search_key_economy = 'economy OR gdp OR stock OR market OR 401k OR retirement OR debt OR loan OR bailout OR bankruptcy OR stimulus OR stock OR market OR 401K OR retirement OR trade OR export OR import OR tax OR manufacture OR package' 
download_guardian_data(search_key_environment, 'economy1')