Skip to content

HTTPS clone URL

Subversion checkout URL

You can clone with HTTPS or Subversion.

Download ZIP
Browse files

Given a URL, retrieve the names and IDs of all voters

  • Loading branch information...
commit 1a7e2ad788f6041443c90431905d1d81d5955e72 1 parent e81639f
@neilkod neilkod authored
Showing with 19 additions and 0 deletions.
  1. +19 −0 scrape_oow_abstracts.py
View
19 scrape_oow_abstracts.py
@@ -0,0 +1,19 @@
+#!/usr/bin/python
+
+# huge work-in-progress
+# given an abstract page, retrieve the names and ids of all of the voters
+
+import re
+import urllib2
+from BeautifulSoup import BeautifulSoup
+url = 'https://mix.oracle.com/events/oow11/proposals/10916-oracle-11gr2-cluster-upgrade-success-story-a-complete-life-cycle'
+page = urllib2.urlopen(url)
+soup = BeautifulSoup(page)
+
+
+voters = soup.findAll('a',{"href":re.compile('/events/oow11/voting/view/'),"title":True})
+
+for voter in voters:
+ name = voter.get('title').lower()
+ id = re.findall(r'\d{3,}',voter.get('href'))[0]
+ print name, id
Please sign in to comment.
Something went wrong with that request. Please try again.