From 2d464d3f70110cd522d4deac43f75d847f384f78 Mon Sep 17 00:00:00 2001 From: Thomas Guignard Date: Fri, 29 Jul 2016 16:14:09 -0400 Subject: [PATCH] Deal with missing postal code --- scraper.py | 5 ++++- 1 file changed, 4 insertions(+), 1 deletion(-) diff --git a/scraper.py b/scraper.py index b63c962..5ca06cd 100644 --- a/scraper.py +++ b/scraper.py @@ -15,7 +15,10 @@ def parse_page(url): college_url = response.xpath('//*[@class="mem-contact"]/p[2]//a/@href')[0] college_address = response.xpath('//*[@class="mem-contact"]/p[1]/text()[1]')[0] college_city = response.xpath('//*[@class="mem-contact"]/p[1]/text()[2]')[0] - college_postalcode = response.xpath('//*[@class="mem-contact"]/p[1]/text()[3]')[0] + try: + college_postalcode = response.xpath('//*[@class="mem-contact"]/p[1]/text()[3]')[0] + except: + college_postalcode = '' #print "Successfully scraped %s in %s" % (college_name.decode('utf-8'), college_city)