Skip to content
Permalink
master
Switch branches/tags
Go to file
 
 
Cannot retrieve contributors at this time
import codecs
import csv
import os
import datakit
# Source archive to fetch and the CSV file this script produces.
URL = 'http://ykaku.com/ginkokensaku/ginkositen.zip'
OUTPUT_FILE_PATH = '/src/data/output.csv'

# Pipeline: fetch the zipped source data, extract it, then rewrite the
# Shift-JIS text file as a CSV whose fields are whitespace-trimmed.
# NOTE(review): `datakit` is a helper module not visible from this file;
# presumably `download(url, path)` saves the URL to `path` and
# `unzip(archive, directory)` extracts into `directory` -- confirm.

# GET raw data
datakit.download(URL, '/tmp/raw.zip')

# UNZIP data
# NOTE(review): the conversion below assumes the archive contains
# `ginkositen.txt` at its top level -- confirm against the real archive.
datakit.unzip('/tmp/raw.zip', '/tmp')

# CONVERT data into CSV
# The source is opened first so that a missing or unreadable extract fails
# before the existing output file is truncated.
# Both files use the built-in open() with newline='' as the csv module
# requires, so line breaks embedded in quoted fields reach the csv parser
# intact instead of being split by the file layer.
with open('/tmp/ginkositen.txt', 'r', encoding='shiftjis', newline='') as source:
    # The output encoding is explicit so the result does not depend on the
    # locale default of the machine running the script.
    with open(OUTPUT_FILE_PATH, 'w', encoding='utf-8', newline='') as output:
        reader = csv.reader(source, delimiter=',', quotechar='"')
        writer = csv.writer(
            output,
            delimiter=',',
            quotechar='"',
            quoting=csv.QUOTE_MINIMAL,
        )
        # Trim leading/trailing whitespace from every field of every row.
        writer.writerows([cell.strip() for cell in row] for row in reader)