Skip to content

Commit

Permalink
add nigeria enugu state spider
Browse files Browse the repository at this point in the history
  • Loading branch information
Ravf95 committed Nov 12, 2021
1 parent b2d592d commit 229707a
Show file tree
Hide file tree
Showing 2 changed files with 33 additions and 0 deletions.
7 changes: 7 additions & 0 deletions docs/spiders.rst
Original file line number Diff line number Diff line change
Expand Up @@ -1001,6 +1001,13 @@ Nigeria
   scrapy crawl nigeria_ekiti_state

.. autoclass:: kingfisher_scrapy.spiders.nigeria_enugu_state.NigeriaEnuguState
   :no-members:

.. code-block:: bash

   scrapy crawl nigeria_enugu_state

.. autoclass:: kingfisher_scrapy.spiders.nigeria_gombe_state.NigeriaGombeState
   :no-members:

Expand Down
26 changes: 26 additions & 0 deletions kingfisher_scrapy/spiders/nigeria_enugu_state.py
Original file line number Diff line number Diff line change
@@ -0,0 +1,26 @@
import scrapy

from kingfisher_scrapy.base_spider import SimpleSpider
from kingfisher_scrapy.util import components, handle_http_error


class NigeriaEnuguState(SimpleSpider):
    """
    Domain
      Nigeria Enugu State Open Contracting Portal
    """
    name = 'nigeria_enugu_state'
    # Root of the portal; every URL requested by this spider is built by appending to it.
    base_url = 'https://dueprocess.en.gov.ng/'

    # SimpleSpider
    data_type = 'release_package'

    def start_requests(self):
        """Yield a single request for the report page and route its response to ``parse_list``."""
        yield scrapy.Request(
            f'{self.base_url}ocds_report.php/',
            meta={'file_name': 'all.html'},
            callback=self.parse_list,
        )

    @handle_http_error
    def parse_list(self, response):
        """Yield one request per link found in the third column of the ``contractTable`` table."""
        hrefs = response.xpath('//table[@id="contractTable"]/tbody/tr/td[3]/a/@href').getall()
        for href in hrefs:
            # Each href is appended to base_url as-is, so it is expected to be relative to the portal root.
            package_url = f'{self.base_url}{href}'
            # NOTE(review): components(-1) presumably derives the file name from the last URL path
            # component - confirm against kingfisher_scrapy.util.components.
            yield self.build_request(package_url, formatter=components(-1))

0 comments on commit 229707a

Please sign in to comment.