-
Notifications
You must be signed in to change notification settings - Fork 0
/
scraper.rb
28 lines (19 loc) · 814 Bytes
/
scraper.rb
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
require 'scraperwiki'
require 'mechanize'
# Scrapes the Dublin City Council councillor list: follows every link found in
# the list container on the front page and, for each linked page, prints the
# absolute URL of the councillor's image followed by the matched details nodes.

# Returns the (possibly relative) image URL found on +page+, or nil if none.
#
# Pages that contain a <picture> with an <img> take the first candidate URL of
# the <picture>'s <source srcset>; otherwise (or if that is missing) the first
# <img> inside div#textContent is used.
def councillor_image_url(page)
  if page.at('picture img')
    source = page.at('picture source')
    # srcset is "url descriptor, url descriptor, ..."; keep only the first URL.
    candidate = source && source['srcset'].to_s[/\S+/]
    return candidate if candidate
  end

  fallback = page.at('div#textContent img')
  fallback && fallback['src']
end

mechanize = Mechanize.new
front_page = mechanize.get('http://www.dublincity.ie/main-menu-your-council-your-city-councillors/full-councillor-list')
page_urls = front_page.search('div#ctl00_PlaceHolderMain_ctl02__ControlWrapper_RichHtmlField a')

page_urls.each do |con_link|
  begin
    con_page = Mechanize::Page::Link.new(con_link, mechanize, front_page).click
  rescue Mechanize::Error => e
    # A dead or non-HTTP link (404, mailto:, ...) should not abort the whole run.
    warn "Skipping #{con_link['href'].inspect}: #{e.message}"
    next
  end

  # Non-HTML responses (PDFs, images, ...) are not parsed pages and cannot be searched.
  next unless con_page.is_a?(Mechanize::Page)

  image_url = councillor_image_url(con_page)
  if image_url
    # Resolve relative image paths against the page's own URL.
    puts con_page.uri.merge(image_url)
  else
    warn "No image found on #{con_page.uri}"
  end

  # NOTE(review): '#text' is a CSS id selector (elements with id="text"), not a
  # text-node selector — confirm this is what was intended.
  con_page.search('div#eventDetails').each do |con_string|
    puts con_string.search('#text')
  end
end