-
Notifications
You must be signed in to change notification settings - Fork 0
/
datagetter.py
39 lines (34 loc) · 1.06 KB
/
datagetter.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
import csv, pandas, sys, time
import cPickle as pickle
def get_data(fname='data/Train.csv'):
    '''
    Import the training data and parse it
    into a pandas data frame.

    fname -- path of the CSV file to read; defaults to
             'data/Train.csv'.

    Returns the pandas.DataFrame produced by pandas.read_csv(fname)
    with its default options. Any error raised by pandas.read_csv
    (for example a missing file) propagates to the caller.
    '''
    return pandas.read_csv(fname)
# Script entry point: load the default training CSV and dump the
# resulting data frame to stdout as a quick sanity check.
if __name__ == '__main__':
    data = get_data('data/Train.csv')
    # Parenthesised single-argument form prints the same text under
    # Python 2 and is also valid syntax under Python 3.
    print(data)
# Convenience function for loading pickle files
def read_file(fin):
    '''
    Load and return the object stored in a pickle file.

    fin -- path of the pickle file; it is opened in binary mode.

    Returns the unpickled object, or None when an IOError is raised
    while opening or reading the file (e.g. the file does not exist).
    Other unpickling errors are not caught and propagate to the caller.

    NOTE(review): unpickling can execute arbitrary code, so this should
    only be used on files from a trusted source -- confirm callers.
    '''
    try:
        # The with-block guarantees the handle is closed, even when
        # pickle.load fails part-way through.
        with open(fin, 'rb') as handle:
            return pickle.load(handle)
    except IOError:
        return None