diff --git a/scraper.py b/scraper.py index c64d47a..2a8c930 100644 --- a/scraper.py +++ b/scraper.py @@ -51,9 +51,12 @@ def get_cell_value(element, css): FIS_URL = "http://data.fis-ski.com/cross-country/results.html" for link, raceinfo in race_link_results(FIS_URL): - # html = scraperwiki.scrape(link) - # root = lxml.html.fromstring(html) - # result_table = root.cssselect("table.fisfootable")[0] + html = scraperwiki.scrape(link) + root = lxml.html.fromstring(html) + result_table = root.cssselect("table.footable")[0] + result_cells = result_table.cssselect("tr") + for result_cell in result_cells: + print result_cell print link print raceinfo['date'] scraperwiki.sqlite.save(unique_keys=['codex'], data=raceinfo, table_name="data")