From 622294e2ea9137e26a719fe48e8472a9ff3a44bc Mon Sep 17 00:00:00 2001 From: Andres Aguilera Date: Thu, 25 Jun 2020 19:54:38 -0400 Subject: [PATCH] Remove mexico_cdmx scraper --- kingfisher_scrapy/spiders/mexico_cdmx.py | 28 ------------------------ 1 file changed, 28 deletions(-) delete mode 100644 kingfisher_scrapy/spiders/mexico_cdmx.py diff --git a/kingfisher_scrapy/spiders/mexico_cdmx.py b/kingfisher_scrapy/spiders/mexico_cdmx.py deleted file mode 100644 index 00781dc20..000000000 --- a/kingfisher_scrapy/spiders/mexico_cdmx.py +++ /dev/null @@ -1,28 +0,0 @@ -import json - -import scrapy - -from kingfisher_scrapy.base_spider import SimpleSpider -from kingfisher_scrapy.util import components, handle_http_error - - -class MexicoCDMXSource(SimpleSpider): - name = 'mexico_cdmx' - data_type = 'release_package' - - def start_requests(self): - yield scrapy.Request( - 'http://www.contratosabiertos.cdmx.gob.mx/api/contratos/todos', - meta={'file_name': 'list.json'}, - callback=self.parse_list - ) - - @handle_http_error - def parse_list(self, response): - items = json.loads(response.text) - if self.sample: - items = [items[0]] - - for item in items: - # URL looks like http://www.contratosabiertos.cdmx.gob.mx/api/contrato/OCDS-87SD3T-SEDEMA-LP-0027-2017 - yield self.build_request(item['uri'], formatter=components(-1))