Commit

feat(script): add script
fabiancook committed Nov 6, 2014
1 parent 59d1a27 commit 5f8b7ef
Showing 9 changed files with 271 additions and 0 deletions.
1 change: 1 addition & 0 deletions .idea/.name

8 changes: 8 additions & 0 deletions .idea/countries_org-scraper.iml

4 changes: 4 additions & 0 deletions .idea/encodings.xml

4 changes: 4 additions & 0 deletions .idea/misc.xml

8 changes: 8 additions & 0 deletions .idea/modules.xml

5 changes: 5 additions & 0 deletions .idea/scopes/scope_settings.xml

6 changes: 6 additions & 0 deletions .idea/vcs.xml

209 changes: 209 additions & 0 deletions .idea/workspace.xml

26 changes: 26 additions & 0 deletions scraper.py
Expand Up @@ -21,3 +21,29 @@
# on Morph for Python (https://github.com/openaustralia/morph-docker-python/blob/master/pip_requirements.txt) and all that matters
# is that your final data is written to an Sqlite database called data.sqlite in the current working directory which
# has at least a table called data.
import scraperwiki
import lxml.html

# Fetch the country listing page.
html = scraperwiki.scrape("http://countrycode.org/")

root = lxml.html.fromstring(html)

i = 0

for tr in root.cssselect("#main_table_blue tbody tr"):
    i += 1
    tds = tr.cssselect("td")

    iso = tds[1].text_content()
    countryCode = tds[2].text_content()

    # The ISO column holds both codes separated by a slash, e.g. "NZ / NZL".
    isoSplit = iso.split('/')

    data = {
        'name': tds[0].text_content().strip(),
        'countryCode': int(countryCode),  # assumes a plain numeric dialing code
        'countryCodeUnique': i,
        'ISO2': isoSplit[0].strip(),
        'ISO3': isoSplit[1].strip()
    }

    # Write each row to data.sqlite, as the comment above notes morph.io expects.
    scraperwiki.sqlite.save(unique_keys=['countryCodeUnique'], data=data)
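Once the scraper has run, the rows it saved can be read back from data.sqlite with Python's built-in sqlite3 module. A minimal sketch, using an in-memory database and a hypothetical sample row standing in for the scraper's real output (the table and column names follow the dictionary built in the loop above):

```python
import sqlite3

# Connect to the output database; against real scraper output this would be
# sqlite3.connect("data.sqlite"), and morph.io expects a table named "data".
conn = sqlite3.connect(":memory:")

# Recreate the schema implied by the scraper's data dictionary and insert
# one hypothetical row for illustration.
conn.execute(
    "CREATE TABLE data (name TEXT, countryCode INTEGER, "
    "countryCodeUnique INTEGER, ISO2 TEXT, ISO3 TEXT)"
)
conn.execute(
    "INSERT INTO data VALUES (?, ?, ?, ?, ?)",
    ("New Zealand", 64, 1, "NZ", "NZL"),
)

# Query the way a consumer of the scraper's output would.
for name, code, unique, iso2, iso3 in conn.execute(
    "SELECT * FROM data WHERE ISO2 = ?", ("NZ",)
):
    print(name, code, iso2, iso3)  # prints: New Zealand 64 NZ NZL
```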
