Skip to content

Commit

Permalink
Given a URL, retrieve the names and IDs of all voters
Browse files Browse the repository at this point in the history
  • Loading branch information
neilkod committed Jun 17, 2011
1 parent e81639f commit 1a7e2ad
Showing 1 changed file with 19 additions and 0 deletions.
19 changes: 19 additions & 0 deletions scrape_oow_abstracts.py
@@ -0,0 +1,19 @@
#!/usr/bin/python

# huge work-in-progress
# given an abstract page, retrieve the names and ids of all of the voters

import re
import urllib2
from BeautifulSoup import BeautifulSoup
# Abstract page whose voter list is scraped.
url = 'https://mix.oracle.com/events/oow11/proposals/10916-oracle-11gr2-cluster-upgrade-success-story-a-complete-life-cycle'

# Fetch and parse the page. The response is closed explicitly so the
# connection is released even when parsing raises.
page = urllib2.urlopen(url)
try:
    soup = BeautifulSoup(page)
finally:
    page.close()

# Patterns are compiled once, outside the loop.
voter_link_pattern = re.compile('/events/oow11/voting/view/')
voter_id_pattern = re.compile(r'\d{3,}')

# Voter links are anchors that point at the voting view and carry a
# title attribute; the title is used as the voter's name below.
voters = soup.findAll('a', {"href": voter_link_pattern, "title": True})

for voter in voters:
    name = voter.get('title').lower()
    # The voter id is the first run of three or more digits in the href.
    id_match = voter_id_pattern.search(voter.get('href'))
    if id_match is None:
        # No numeric id in this link: skip it instead of failing with an
        # IndexError and losing the remaining voters.
        continue
    voter_id = id_match.group(0)  # named voter_id to avoid shadowing builtin id()
    # Single pre-formatted argument: prints "name id" under the Python 2
    # print statement and also parses as a Python 3 print() call.
    print("%s %s" % (name, voter_id))

0 comments on commit 1a7e2ad

Please sign in to comment.