Skip to content

Commit

Permalink
Update scraper.py
Browse files Browse the repository at this point in the history
  • Loading branch information
eirikeikaas committed Oct 25, 2018
1 parent 20f4282 commit afa57aa
Showing 1 changed file with 8 additions and 8 deletions.
16 changes: 8 additions & 8 deletions scraper.py
Expand Up @@ -57,19 +57,19 @@ def get_cell_value(element, css):
result_table = root.cssselect("table.footable")[0]
result_cells = result_table.cssselect("tr")
for result_cell in result_cells:
- athlete_url = result_cell.cssselect("td")[2].cssselect("a")[0].get("href")
+ athlete_url = result_cell.cssselect("td")[1].cssselect("a")[0].get("href")
parsed = urlparse.urlparse(athlete_url)
athlete_id = urlparse.parse_qs(parsed.query)['competitorid']
result = {
'event': raceinfo['codex'],
- 'rank': get_cell_value(result_cell.cssselect("td")[1], ""),
- 'athlete': get_cell_value(result_cell.cssselect("td")[2], "a"),
+ 'rank': get_cell_value(result_cell.cssselect("td")[0], ""),
+ 'athlete': get_cell_value(result_cell.cssselect("td")[1], "a"),
'competitor_id': athlete_id,
- 'yob': get_cell_value(result_cell.cssselect("td")[3], ""),
- 'nation': get_cell_value(result_cell.cssselect("td")[4], ""),
- 'time': get_cell_value(result_cell.cssselect("td")[5], ""),
- 'behind': get_cell_value(result_cell.cssselect("td")[6], ""),
- 'points': get_cell_value(result_cell.cssselect("td")[7], "")
+ 'yob': get_cell_value(result_cell.cssselect("td")[2], ""),
+ 'nation': get_cell_value(result_cell.cssselect("td")[3], ""),
+ 'time': get_cell_value(result_cell.cssselect("td")[4], ""),
+ 'behind': get_cell_value(result_cell.cssselect("td")[5], ""),
+ 'points': get_cell_value(result_cell.cssselect("td")[6], "")
}
print result
print link
Expand Down

0 comments on commit afa57aa

Please sign in to comment.