Skip to content

Commit

Permalink
Merge f93763b into 4b2ff8b
Browse files Browse the repository at this point in the history
  • Loading branch information
aguilerapy committed May 28, 2020
2 parents 4b2ff8b + f93763b commit 9fea48f
Show file tree
Hide file tree
Showing 22 changed files with 156 additions and 1 deletion.
7 changes: 6 additions & 1 deletion kingfisher_scrapy/spiders/armenia.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,11 @@


class Armenia(BaseSpider):
"""
Spider arguments
sample
Download only the first release package in the dataset.
"""
name = 'armenia'

def start_requests(self):
Expand All @@ -22,7 +27,7 @@ def parse(self, response):
data_type='release_package')

json_data = json.loads(response.text)
if not (self.sample):
if not self.sample:
if 'next_page' in json_data and 'uri' in json_data['next_page']:
url = json_data['next_page']['uri']
yield scrapy.Request(
Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/australia.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,13 @@


class Australia(LinksSpider):
"""
API documentation
https://data.gov.au/dataset/ds-dga-5c7fa69b-b0e9-4553-b8df-2a022dd2e982/distribution/dist-dga-a7f471ad-e085-49b5-bd6b-1b270ea46e99/details?q=
Spider arguments
sample
Download only data released in 2018.
"""
name = 'australia'
data_type = 'release_package'

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/australia_nsw.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,13 @@


class AustraliaNSW(BaseSpider):
"""
API documentation
https://github.com/NSW-eTendering/NSW-eTendering-API/blob/master/README.md
Spider arguments
sample
Download only 30 releases.
"""
name = 'australia_nsw'

def start_requests(self):
Expand Down
5 changes: 5 additions & 0 deletions kingfisher_scrapy/spiders/chile_compra_bulk.py
Original file line number Diff line number Diff line change
Expand Up @@ -6,6 +6,11 @@


class ChileCompraBulk(ZipSpider):
"""
Spider arguments
sample
Download only data released in February 2017.
"""
name = 'chile_compra_bulk'
download_warnsize = 0
download_timeout = 99999
Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/chile_compra_records.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,13 @@


class ChileCompraRecords(ChileCompraBaseSpider):
"""
Swagger API documentation
https://desarrolladores.mercadopublico.cl/docs/services/5a9ed02f718ed712f4403e75/operations/data-listaa-omes-agno-mes?
Spider arguments
sample
Download only data released in October 2017.
"""
name = 'chile_compra_records'

@handle_error
Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/chile_compra_releases.py
Original file line number Diff line number Diff line change
Expand Up @@ -3,6 +3,13 @@


class ChileCompraReleases(ChileCompraBaseSpider):
"""
Swagger API documentation
https://desarrolladores.mercadopublico.cl/docs/services/5a9ed02f718ed712f4403e75/operations/data-listaa-omes-agno-mes?
Spider arguments
sample
Download only data released in October 2017.
"""
name = 'chile_compra_releases'

@handle_error
Expand Down
13 changes: 13 additions & 0 deletions kingfisher_scrapy/spiders/colombia.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,19 @@


class Colombia(LinksSpider):
"""
API documentation
https://www.colombiacompra.gov.co/transparencia/api
Swagger API documentation
https://apiocds.colombiacompra.gov.co:8443/apiCCE2.0/
Spider arguments
sample
Download only the first page of results.
page
The page number from which to start crawling.
year
The year to crawl. See API documentation for valid values.
"""
name = 'colombia'
sleep = 120 * 60

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/honduras_portal_records.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,13 @@


class HondurasPortalRecords(BaseSpider):
"""
API documentation
http://www.contratacionesabiertas.gob.hn/servicio/
Spider arguments
sample
Download only the first record package in the dataset.
"""
name = 'honduras_portal_records'
download_delay = 0.9

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/honduras_portal_releases.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,13 @@


class HondurasPortalReleases(BaseSpider):
"""
API documentation
http://www.contratacionesabiertas.gob.hn/servicio/
Spider arguments
sample
Download only the first release package in the dataset.
"""
name = 'honduras_portal_releases'
download_delay = 0.9

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/kenya_makueni.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,13 @@


class KenyaMakueni(BaseSpider):
"""
Swagger API documentation
https://opencontracting.makueni.go.ke/swagger-ui.html#/ocds-controller
Spider arguments
sample
Download only the first 10 release packages in the dataset.
"""
name = 'kenya_makueni'
url = 'https://opencontracting.makueni.go.ke/api/ocds/package/all?pageSize={}&pageNumber={}'

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/malta.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,13 @@


class Malta(ZipSpider):
"""
API documentation
https://docs.google.com/document/d/1VnCEywKkkQ7BcVbT7HlW2s_N_QI8W0KE/edit
Spider arguments
sample
Download only data released in October 2019.
"""
name = 'malta'

parse_zipfile_kwargs = {'data_type': 'record_package'}
Expand Down
9 changes: 9 additions & 0 deletions kingfisher_scrapy/spiders/mexico_quien_es_quien.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,15 @@


class MexicoQuienEsQuien(BaseSpider):
"""
API documentation
https://quienesquienapi.readthedocs.io/es/latest/
Swagger API documentation
https://api.quienesquien.wiki/v2/docs/
Spider arguments
sample
Download a single record package with 10 records.
"""
name = 'mexico_quien_es_quien'
download_delay = 0.9
url = 'https://api.quienesquien.wiki/v2/contracts?limit={}&offset={}'
Expand Down
5 changes: 5 additions & 0 deletions kingfisher_scrapy/spiders/nepal_dhangadhi.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,11 @@


class NepalDhangadhi(BaseSpider):
"""
Spider arguments
sample
Download only the first release package in the dataset.
"""
name = "nepal_dhangadhi"

def start_requests(self):
Expand Down
5 changes: 5 additions & 0 deletions kingfisher_scrapy/spiders/nepal_portal.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,11 @@


class NepalPortal(BaseSpider):
"""
Spider arguments
sample
Download only data released in 2018.
"""
name = 'nepal_portal'

def start_requests(self):
Expand Down
5 changes: 5 additions & 0 deletions kingfisher_scrapy/spiders/nigeria_portal.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,11 @@


class NigeriaPortal(BaseSpider):
"""
Spider arguments
sample
Download only the first release package in the dataset.
"""
name = 'nigeria_portal'
start_urls = ['http://nocopo.bpp.gov.ng/OpenData.aspx']
download_delay = 0.9
Expand Down
12 changes: 12 additions & 0 deletions kingfisher_scrapy/spiders/paraguay_hacienda.py
Original file line number Diff line number Diff line change
Expand Up @@ -9,6 +9,18 @@


class ParaguayHacienda(BaseSpider):
"""
Swagger API documentation
https://datos.hacienda.gov.py/odmh-api-v1/api-docs/
Spider arguments
sample
Download only 11 releases.
Environment variables
KINGFISHER_PARAGUAY_HACIENDA_REQUEST_TOKEN
To get an API account and request token, go to https://datos.hacienda.gov.py/aplicaciones/new.
KINGFISHER_PARAGUAY_HACIENDA_CLIENT_SECRET
Your generated client secret.
"""
name = 'paraguay_hacienda'

start_time = None
Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/portugal.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,13 @@


class Portugal(ZipSpider):
"""
API documentation
https://dados.gov.pt/pt/apidoc/
Spider arguments
sample
Download only the first file in the dataset.
"""
name = 'portugal'
download_warnsize = 0
download_timeout = 9999
Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/uganda_releases.py
Original file line number Diff line number Diff line change
Expand Up @@ -8,6 +8,13 @@


class Uganda(BaseSpider):
"""
API documentation
https://docs.google.com/spreadsheets/d/10tVioy-VOQa1FwWoRl5e1pMbGpiymA0iycNcoDFkvks/edit#gid=365266172
Spider arguments
sample
Download only 19 releases.
"""
name = 'uganda_releases'
download_delay = 0.9

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/uruguay_historical.py
Original file line number Diff line number Diff line change
Expand Up @@ -4,6 +4,13 @@


class UruguayHistorical(ZipSpider):
"""
API documentation
https://www.gub.uy/agencia-compras-contrataciones-estado/datos-y-estadisticas/datos/open-contracting
Spider arguments
sample
Download only data released in 2002.
"""
name = 'uruguay_historical'
# the files take too long to download, so we increase the download timeout
download_timeout = 1000
Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/uruguay_records.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,13 @@


class UruguayRecords(UruguayBase):
"""
API documentation
https://www.gub.uy/agencia-compras-contrataciones-estado/datos-y-estadisticas/datos/open-contracting
Spider arguments
sample
Download only 1 record.
"""
name = 'uruguay_records'
base_record_url = 'https://www.comprasestatales.gub.uy/ocds/record/{}'

Expand Down
7 changes: 7 additions & 0 deletions kingfisher_scrapy/spiders/uruguay_releases.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,13 @@


class UruguayReleases(UruguayBase):
"""
API documentation
https://www.gub.uy/agencia-compras-contrataciones-estado/datos-y-estadisticas/datos/open-contracting
Spider arguments
sample
Download only 1 release.
"""
name = 'uruguay_releases'

@handle_error
Expand Down
5 changes: 5 additions & 0 deletions kingfisher_scrapy/spiders/zambia.py
Original file line number Diff line number Diff line change
Expand Up @@ -7,6 +7,11 @@


class Zambia(ZipSpider):
"""
Spider arguments
sample
Download only data released in July 2016.
"""
name = 'zambia'

parse_zipfile_kwargs = {'data_type': 'record_package'}
Expand Down

0 comments on commit 9fea48f

Please sign in to comment.