Permalink
Browse files

Update scraper.py

  • Loading branch information...
danozgriff committed May 11, 2016
1 parent 568607c commit bccf9ba658ced8e6f29ee9443a635d7fdbad95e6
Showing with 3 additions and 1 deletion.
  1. +3 −1 scraper.py
View
@@ -3,7 +3,9 @@
# Fetch the current shipping schedule PDF published by Pilbara Ports.
u=urllib2.urlopen("http://pilbaraports.com.au/Shipping_Schedule/Current_Shipping_Schedule.pdf")
try:
    # The response object itself is not XML text, so it must not be handed to
    # lxml directly; read the PDF bytes and convert them first.
    x=scraperwiki.pdftoxml(u.read())
finally:
    # Always release the HTTP connection, even if the conversion fails.
    u.close()

# Show the start of the converted document as a quick sanity check.
print(x[:1024])

# Parse the converted XML so it can be queried with XPath.
r=lxml.etree.fromstring(x)

# Exploratory queries against the converted layout.
first_page = r.xpath('//page[@number="1"]')
# Bold text inside <text> elements whose left attribute is "64"
# (presumably one column of the schedule table -- confirm against the PDF).
bold_cells = r.xpath('//text[@left="64"]/b')
bold_preview = bold_cells[0:10]
# Guard the fixed index: the PDF layout may yield fewer than nine matches.
ninth_bold_text = bold_cells[8].text if len(bold_cells) > 8 else None

0 comments on commit bccf9ba

Please sign in to comment.