In [141]:
import pandas as pd
import numpy as np

In [133]:
from pandas import Series, DataFrame

Series

A Series is a one-dimensional array-like object containing a sequence of      values (of similar types to NumPy types) and an associated array of data      labels, called its index. The simplest Series is      formed from only an array of data:

In [134]:
obj = pd.Series([4, 7, -5, 3])

In [135]:
obj

0    4
1    7
2   -5
3    3
dtype: int64

In [5]:
obj.values

array([ 4,  7, -5,  3], dtype=int64)

In [6]:
obj.index  #like range(4)

RangeIndex(start=0, stop=4, step=1)

In [7]:
obj2 = pd.Series([4, 7, -5, 3], index=['d', 'b', 'a', 'c'])

In [8]:
obj2

d    4
b    7
a   -5
c    3
dtype: int64

In [9]:
obj2.index

Index(['d', 'b', 'a', 'c'], dtype='object')

In [10]:
obj2['a']

-5

In [11]:
obj2['d'] = 6

In [12]:
obj2[['c', 'a', 'd']]

c    3
a   -5
d    6
dtype: int64

In [13]:
obj2[obj2 > 0]

d    6
b    7
c    3
dtype: int64

In [15]:
obj2 * 2

d    12
b    14
a   -10
c     6
dtype: int64

In [18]:
np.exp(obj2)

d     403.428793
b    1096.633158
a       0.006738
c      20.085537
dtype: float64

Should you have data contained in a Python dict, you can create a      Series from it by passing the dict:

In [19]:
sdata = {'Ohio' : 35000, 'Texas': 71000, 'Oregon': 16000, 'Utah': 5000}

In [20]:
obj3 = pd.Series(sdata)

In [21]:
obj3

Ohio      35000
Texas     71000
Oregon    16000
Utah       5000
dtype: int64

In [22]:
states = ['California', 'Ohio', 'Oregon', 'Texas']

In [23]:
obj4 = pd.Series(sdata, index=states)

In [24]:
obj4

California        NaN
Ohio          35000.0
Oregon        16000.0
Texas         71000.0
dtype: float64

In [25]:
pd.isnull(obj4)

California     True
Ohio          False
Oregon        False
Texas         False
dtype: bool

In [26]:
pd.notnull(obj4)

California    False
Ohio           True
Oregon         True
Texas          True
dtype: bool

In [27]:
obj4.isnull()

California     True
Ohio          False
Oregon        False
Texas         False
dtype: bool

In [28]:
obj3

Ohio      35000
Texas     71000
Oregon    16000
Utah       5000
dtype: int64

In [29]:
obj4

California        NaN
Ohio          35000.0
Oregon        16000.0
Texas         71000.0
dtype: float64

In [30]:
obj3 + obj4

California         NaN
Ohio           70000.0
Oregon         32000.0
Texas         142000.0
Utah               NaN
dtype: float64

In [31]:
obj4.name = 'population'

In [32]:
obj4.index.name = 'state'

In [33]:
obj4

state
California        NaN
Ohio          35000.0
Oregon        16000.0
Texas         71000.0
Name: population, dtype: float64

In [34]:
obj

0    4
1    7
2   -5
3    3
dtype: int64

DataFrame

A DataFrame represents a rectangular table of data and contains an      ordered collection of columns, each of which can be a different value      type (numeric, string, boolean, etc.).

In [39]:
data = {'state': ['Ohio', 'Ohio', 'Ohio', 'Nevada', 'Nevada', "Nevada"],
        'year': [2000, 2001, 2002, 2001, 2003, 2002],
        'pop': [1.5, 1.7, 3.6, 2.4, 2.9, 3.2]}

In [42]:
frame = pd.DataFrame(data)

In [43]:
frame.head()

Unnamed: 0,state,year,pop
0,Ohio,2000,1.5
1,Ohio,2001,1.7
2,Ohio,2002,3.6
3,Nevada,2001,2.4
4,Nevada,2003,2.9


In [44]:
frame

Unnamed: 0,state,year,pop
0,Ohio,2000,1.5
1,Ohio,2001,1.7
2,Ohio,2002,3.6
3,Nevada,2001,2.4
4,Nevada,2003,2.9
5,Nevada,2002,3.2


In [46]:
pd.DataFrame(data, columns=['year', 'state', 'pop'])

Unnamed: 0,year,state,pop
0,2000,Ohio,1.5
1,2001,Ohio,1.7
2,2002,Ohio,3.6
3,2001,Nevada,2.4
4,2003,Nevada,2.9
5,2002,Nevada,3.2


In [49]:
frame2 = pd.DataFrame(data, columns=['year', 'state', 'pop', 'debt'],
                     index =['One', 'Two', 'Three', 'Four', 'Five', 'Six'])

In [50]:
frame2

Unnamed: 0,year,state,pop,debt
One,2000,Ohio,1.5,
Two,2001,Ohio,1.7,
Three,2002,Ohio,3.6,
Four,2001,Nevada,2.4,
Five,2003,Nevada,2.9,
Six,2002,Nevada,3.2,


In [51]:
frame2.columns

Index(['year', 'state', 'pop', 'debt'], dtype='object')

In [52]:
frame2['state']

One        Ohio
Two        Ohio
Three      Ohio
Four     Nevada
Five     Nevada
Six      Nevada
Name: state, dtype: object

In [53]:
frame2.year

One      2000
Two      2001
Three    2002
Four     2001
Five     2003
Six      2002
Name: year, dtype: int64

In [54]:
frame2.loc['Three']

year     2002
state    Ohio
pop       3.6
debt      NaN
Name: Three, dtype: object

Columns can be modified by assignment. For example, the empty 'debt' column could be assigned a scalar value or an array of values:

In [55]:
frame2['debt'] = 16.5

In [56]:
frame2

Unnamed: 0,year,state,pop,debt
One,2000,Ohio,1.5,16.5
Two,2001,Ohio,1.7,16.5
Three,2002,Ohio,3.6,16.5
Four,2001,Nevada,2.4,16.5
Five,2003,Nevada,2.9,16.5
Six,2002,Nevada,3.2,16.5


In [57]:
frame2['debt'] = np.arange(6.)

In [58]:
frame2

Unnamed: 0,year,state,pop,debt
One,2000,Ohio,1.5,0.0
Two,2001,Ohio,1.7,1.0
Three,2002,Ohio,3.6,2.0
Four,2001,Nevada,2.4,3.0
Five,2003,Nevada,2.9,4.0
Six,2002,Nevada,3.2,5.0


In [59]:
val = pd.Series([-1.2, -1.5, -1.7], index=['Two', 'Three', 'Five'])

In [60]:
frame2['debt'] = val

In [61]:
frame2

Unnamed: 0,year,state,pop,debt
One,2000,Ohio,1.5,
Two,2001,Ohio,1.7,-1.2
Three,2002,Ohio,3.6,-1.5
Four,2001,Nevada,2.4,
Five,2003,Nevada,2.9,-1.7
Six,2002,Nevada,3.2,


In [62]:
frame2['eastern'] = frame2.state == 'Ohio'

In [63]:
frame2

Unnamed: 0,year,state,pop,debt,eastern
One,2000,Ohio,1.5,,True
Two,2001,Ohio,1.7,-1.2,True
Three,2002,Ohio,3.6,-1.5,True
Four,2001,Nevada,2.4,,False
Five,2003,Nevada,2.9,-1.7,False
Six,2002,Nevada,3.2,,False


In [64]:
del frame2['eastern']

In [65]:
frame2.columns

Index(['year', 'state', 'pop', 'debt'], dtype='object')

In [66]:
pop = {'Nevada': {2001: 2.4, 2002: 2.9},
      'Ohio': {2000: 1.5, 2001: 1.7, 2002: 3.6}}

In [67]:
frame3 = pd.DataFrame(pop)

In [68]:
frame3

Unnamed: 0,Nevada,Ohio
2000,,1.5
2001,2.4,1.7
2002,2.9,3.6


In [69]:
frame3.T

Unnamed: 0,2000,2001,2002
Nevada,,2.4,2.9
Ohio,1.5,1.7,3.6


In [70]:
pd.DataFrame(pop, index=[2001, 2002, 2003])

Unnamed: 0,Nevada,Ohio
2001,2.4,1.7
2002,2.9,3.6
2003,,


In [72]:
pdata = {'Ohio': frame3['Ohio'][:-1],
         'Nevada': frame3['Nevada'][:2]}

In [73]:
pd.DataFrame(pdata)

Unnamed: 0,Ohio,Nevada
2000,1.5,
2001,1.7,2.4


In [74]:
frame3.index.name = 'year'; frame3.columns.name = 'state'

In [75]:
frame3

state,Nevada,Ohio
year,Unnamed: 1_level_1,Unnamed: 2_level_1
2000,,1.5
2001,2.4,1.7
2002,2.9,3.6


In [76]:
frame3.values

array([[nan, 1.5],
       [2.4, 1.7],
       [2.9, 3.6]])

In [77]:
frame2.values

array([[2000, 'Ohio', 1.5, nan],
       [2001, 'Ohio', 1.7, -1.2],
       [2002, 'Ohio', 3.6, -1.5],
       [2001, 'Nevada', 2.4, nan],
       [2003, 'Nevada', 2.9, -1.7],
       [2002, 'Nevada', 3.2, nan]], dtype=object)

In [78]:
obj = pd.Series(range(3), index=['a', 'b', 'c'])

In [79]:
index = obj.index

In [80]:
index

Index(['a', 'b', 'c'], dtype='object')

In [81]:
index[1:]

Index(['b', 'c'], dtype='object')

In [82]:
index[1]

'b'

In [83]:
frame3

state,Nevada,Ohio
year,Unnamed: 1_level_1,Unnamed: 2_level_1
2000,,1.5
2001,2.4,1.7
2002,2.9,3.6


In [85]:
frame3.columns

Index(['Nevada', 'Ohio'], dtype='object', name='state')

In [86]:
'Ohio' in frame3.columns

True

In [87]:
2003 in frame3.index

False

In [88]:
frame = pd.DataFrame(np.arange(9).reshape(3, 3),
                    index=['a', 'c', 'd'],
                    columns=['Ohio', 'Texas', 'California'])

In [89]:
frame

Unnamed: 0,Ohio,Texas,California
a,0,1,2
c,3,4,5
d,6,7,8


In [91]:
frame2 = frame.reindex(['a', 'b', 'c', 'd'])

In [92]:
frame2

Unnamed: 0,Ohio,Texas,California
a,0.0,1.0,2.0
b,,,
c,3.0,4.0,5.0
d,6.0,7.0,8.0


In [93]:
states = ['Texas', 'Utah', 'California']

In [94]:
frame.reindex(columns=states)

Unnamed: 0,Texas,Utah,California
a,1,,2
c,4,,5
d,7,,8


You can reindex more succinctly by label-indexing with loc, and many users prefer to use it exclusively:

In [95]:
frame.loc[['a', 'b', 'c', 'd']]

Passing list-likes to .loc or [] with any missing label will raise
KeyError in the future, you can use .reindex() as an alternative.

See the documentation here:
https://pandas.pydata.org/pandas-docs/stable/indexing.html#deprecate-loc-reindex-listlike
  """Entry point for launching an IPython kernel.


Unnamed: 0,Ohio,Texas,California
a,0.0,1.0,2.0
b,,,
c,3.0,4.0,5.0
d,6.0,7.0,8.0


In [98]:
data = pd.DataFrame(np.arange(16).reshape((4,4)),
                   index=['Ohio', 'Colorado', 'Utah', 'New York'],
                   columns=['one', 'two', 'three', 'four'])

In [99]:
data

Unnamed: 0,one,two,three,four
Ohio,0,1,2,3
Colorado,4,5,6,7
Utah,8,9,10,11
New York,12,13,14,15


In [100]:
#Calling drop with a sequence of labels will      drop values from the row labels (axis 0):

data.drop(['Colorado', 'Ohio'])

Unnamed: 0,one,two,three,four
Utah,8,9,10,11
New York,12,13,14,15


In [101]:
#You can drop values from the columns by passing      axis=1 or axis='columns':

data.drop('two', axis=1)

Unnamed: 0,one,three,four
Ohio,0,2,3
Colorado,4,6,7
Utah,8,10,11
New York,12,14,15


In [103]:
data.drop(['two', 'four'], axis='columns')

Unnamed: 0,one,three
Ohio,0,2
Colorado,4,6
Utah,8,10
New York,12,14


In [104]:
obj.drop('c', inplace=True)

In [105]:
obj

a    0
b    1
dtype: int64

In [106]:
#Be careful with the inplace, as it destroys any data that is dropped.

In [108]:
data = pd.DataFrame(np.arange(16).reshape((4, 4)),
                   index=['Ohio', 'Colorado', 'Utah', 'New York'],
                   columns=['one', 'two', 'three', 'four'])

In [109]:
data

Unnamed: 0,one,two,three,four
Ohio,0,1,2,3
Colorado,4,5,6,7
Utah,8,9,10,11
New York,12,13,14,15


In [110]:
data['two']

Ohio         1
Colorado     5
Utah         9
New York    13
Name: two, dtype: int32

In [112]:
data[['three', 'one']]

Unnamed: 0,three,one
Ohio,2,0
Colorado,6,4
Utah,10,8
New York,14,12


In [113]:
data[:2]

Unnamed: 0,one,two,three,four
Ohio,0,1,2,3
Colorado,4,5,6,7


In [114]:
data[data['three'] >5]

Unnamed: 0,one,two,three,four
Colorado,4,5,6,7
Utah,8,9,10,11
New York,12,13,14,15


In [115]:
data < 5

Unnamed: 0,one,two,three,four
Ohio,True,True,True,True
Colorado,True,False,False,False
Utah,False,False,False,False
New York,False,False,False,False


In [116]:
data[data < 5] = 0

In [117]:
data

Unnamed: 0,one,two,three,four
Ohio,0,0,0,0
Colorado,0,5,6,7
Utah,8,9,10,11
New York,12,13,14,15


Data Loading, Storage, and File  Formats

In [150]:
df = pd.read_csv("C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv")

In [149]:
import csv
data = open(r"C:\Users\TejYadav\Desktop\Tests\annual-balance-sheets-200817.csv")
data = csv.reader(data)  
print(data)

<_csv.reader object at 0x0000018CCA697D48>


In [151]:
df

Unnamed: 0,Year,Institutional_sector_name,Institutional_sector_code,Descriptor,SNA08TRANS,Asset_liability_code,Status,Values
0,2008.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,225544
1,2009.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,243315
2,2010.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,259381
3,2011.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,262596
4,2012.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,267100
5,2013.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,273639
6,2014.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,285309
7,2015.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,296896
8,2016.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,311332
9,2017.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,FINAL,331983


In [152]:
pd.read_table('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv')

  """Entry point for launching an IPython kernel.


Unnamed: 0,"Year,Institutional_sector_name,Institutional_sector_code,Descriptor,SNA08TRANS,Asset_liability_code,Status,Values"
0,"2008.03,Corporate business enterprises,141,Cap..."
1,"2009.03,Corporate business enterprises,141,Cap..."
2,"2010.03,Corporate business enterprises,141,Cap..."
3,"2011.03,Corporate business enterprises,141,Cap..."
4,"2012.03,Corporate business enterprises,141,Cap..."
5,"2013.03,Corporate business enterprises,141,Cap..."
6,"2014.03,Corporate business enterprises,141,Cap..."
7,"2015.03,Corporate business enterprises,141,Cap..."
8,"2016.03,Corporate business enterprises,141,Cap..."
9,"2017.03,Corporate business enterprises,141,Cap..."


In [153]:
names = ['a', 'b', 'c', 'd', 'message']

In [154]:
pd.read_csv('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv')

Unnamed: 0,Year,Institutional_sector_name,Institutional_sector_code,Descriptor,SNA08TRANS,Asset_liability_code,Status,Values
0,2008.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,225544
1,2009.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,243315
2,2010.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,259381
3,2011.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,262596
4,2012.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,267100
5,2013.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,273639
6,2014.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,285309
7,2015.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,296896
8,2016.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,311332
9,2017.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,FINAL,331983


In [155]:
pd.options.display.max_rows = 10

In [156]:
result = pd.read_csv('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv')

In [157]:
result

Unnamed: 0,Year,Institutional_sector_name,Institutional_sector_code,Descriptor,SNA08TRANS,Asset_liability_code,Status,Values
0,2008.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,225544
1,2009.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,243315
2,2010.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,259381
3,2011.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,262596
4,2012.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,267100
...,...,...,...,...,...,...,...,...
18715,2013.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,FINAL,53768
18716,2014.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,REVISED,58559
18717,2015.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,REVISED,70099
18718,2016.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,REVISED,76021


In [158]:
pd.read_csv('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv', nrows=5)

Unnamed: 0,Year,Institutional_sector_name,Institutional_sector_code,Descriptor,SNA08TRANS,Asset_liability_code,Status,Values
0,2008.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,225544
1,2009.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,243315
2,2010.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,259381
3,2011.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,262596
4,2012.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,267100


In [162]:
'''
chunker = pd.read_csv('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv', chunksize=1000)

tot = pd.Series([])
for piece in chunker:
    tot = tot.add(piece['key'].value_counts(), fill_value=0)

tot = tot.sort_values(ascending=False)
'''

"\nchunker = pd.read_csv('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv', chunksize=1000)\n\ntot = pd.Series([])\nfor piece in chunker:\n    tot = tot.add(piece['key'].value_counts(), fill_value=0)\n\ntot = tot.sort_values(ascending=False)\n"

In [163]:
tot[:10]

Series([], dtype: float64)

In [164]:
import sys

data.to_csv(sys.stdout, sep='|')

AttributeError: '_csv.reader' object has no attribute 'to_csv'

In [165]:
data_to_csv(sys.stdout, index=False, header=False)

NameError: name 'data_to_csv' is not defined

In [167]:
import csv
f = open('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv')
reader = csv.reader(f)

In [168]:
for line in reader:
    print(line)

['ï»¿Year', 'Institutional_sector_name', 'Institutional_sector_code', 'Descriptor', 'SNA08TRANS', 'Asset_liability_code', 'Status', 'Values']
['2008.03', 'Corporate business enterprises', '141', 'Capital Account Opening balances Produced non-financial assets', 'LS00000', 'AN10000', 'REVISED', '225544']
['2009.03', 'Corporate business enterprises', '141', 'Capital Account Opening balances Produced non-financial assets', 'LS00000', 'AN10000', 'REVISED', '243315']
['2010.03', 'Corporate business enterprises', '141', 'Capital Account Opening balances Produced non-financial assets', 'LS00000', 'AN10000', 'REVISED', '259381']
['2011.03', 'Corporate business enterprises', '141', 'Capital Account Opening balances Produced non-financial assets', 'LS00000', 'AN10000', 'REVISED', '262596']
['2012.03', 'Corporate business enterprises', '141', 'Capital Account Opening balances Produced non-financial assets', 'LS00000', 'AN10000', 'REVISED', '267100']
['2013.03', 'Corporate business enterprises', '1

['2008.03', 'Financial auxiliaries', '27', 'Revaluation Account Financial assets Insurance, pension and standardised guarantee schemes', 'K070000', 'AFA0600', 'FINAL', '0']
['2009.03', 'Financial auxiliaries', '27', 'Revaluation Account Financial assets Insurance, pension and standardised guarantee schemes', 'K070000', 'AFA0600', 'FINAL', '0']
['2010.03', 'Financial auxiliaries', '27', 'Revaluation Account Financial assets Insurance, pension and standardised guarantee schemes', 'K070000', 'AFA0600', 'FINAL', '0']
['2011.03', 'Financial auxiliaries', '27', 'Revaluation Account Financial assets Insurance, pension and standardised guarantee schemes', 'K070000', 'AFA0600', 'FINAL', '0']
['2012.03', 'Financial auxiliaries', '27', 'Revaluation Account Financial assets Insurance, pension and standardised guarantee schemes', 'K070000', 'AFA0600', 'FINAL', '0']
['2013.03', 'Financial auxiliaries', '27', 'Revaluation Account Financial assets Insurance, pension and standardised guarantee schemes'

['2008.03', 'Central government institutions excluding funded social insurance schemes', '311', 'Capital Account Closing balances Produced non-financial assets', 'LE00000', 'AN10000', 'REVISED', '48821']
['2009.03', 'Central government institutions excluding funded social insurance schemes', '311', 'Capital Account Closing balances Produced non-financial assets', 'LE00000', 'AN10000', 'REVISED', '54023']
['2010.03', 'Central government institutions excluding funded social insurance schemes', '311', 'Capital Account Closing balances Produced non-financial assets', 'LE00000', 'AN10000', 'REVISED', '57380']
['2011.03', 'Central government institutions excluding funded social insurance schemes', '311', 'Capital Account Closing balances Produced non-financial assets', 'LE00000', 'AN10000', 'REVISED', '57347']
['2012.03', 'Central government institutions excluding funded social insurance schemes', '311', 'Capital Account Closing balances Produced non-financial assets', 'LE00000', 'AN10000', 

['2017.03', 'Central government institutions funded social insurance schemes', '312', 'Other Changes in the Volume of Assets and Liabilities Financial liabilities', 'K050000', 'AFL0000', 'FINAL', '0']
['2008.03', 'Central government institutions funded social insurance schemes', '312', 'Other Changes in the Volume of Assets and Liabilities Changes in classification', 'K060000', 'AF00000', 'FINAL', '0']
['2009.03', 'Central government institutions funded social insurance schemes', '312', 'Other Changes in the Volume of Assets and Liabilities Changes in classification', 'K060000', 'AF00000', 'FINAL', '0']
['2010.03', 'Central government institutions funded social insurance schemes', '312', 'Other Changes in the Volume of Assets and Liabilities Changes in classification', 'K060000', 'AF00000', 'FINAL', '0']
['2011.03', 'Central government institutions funded social insurance schemes', '312', 'Other Changes in the Volume of Assets and Liabilities Changes in classification', 'K060000', 'AF0

['2017.03', 'Non-profit institutions serving households', '411', 'Capital Account Opening balances Non-produced non-financial assets', 'LS00000', 'AN20000', 'FINAL', '10010']
['2008.03', 'Non-profit institutions serving households', '411', 'Capital Account Opening balances Total non-financial assets', 'LS00000', 'AN00000', 'FINAL', '14034']
['2009.03', 'Non-profit institutions serving households', '411', 'Capital Account Opening balances Total non-financial assets', 'LS00000', 'AN00000', 'FINAL', '15268']
['2010.03', 'Non-profit institutions serving households', '411', 'Capital Account Opening balances Total non-financial assets', 'LS00000', 'AN00000', 'FINAL', '15587']
['2011.03', 'Non-profit institutions serving households', '411', 'Capital Account Opening balances Total non-financial assets', 'LS00000', 'AN00000', 'FINAL', '15647']
['2012.03', 'Non-profit institutions serving households', '411', 'Capital Account Opening balances Total non-financial assets', 'LS00000', 'AN00000', 'FI

['2008.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 'K070000', 'AFL0500', 'FINAL', '0']
['2009.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 'K070000', 'AFL0500', 'FINAL', '0']
['2010.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 'K070000', 'AFL0500', 'FINAL', '0']
['2011.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 'K070000', 'AFL0500', 'FINAL', '0']
['2012.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 'K070000', 'AFL0500', 'FINAL', '0']
['2013.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 'K070000', 'AFL0500', 'FINAL', '0']
['2014.03', 'Households', '511', 'Revaluation Account Financial liabilities Equity and investment fund shares', 

['2016.03', 'Rest of the world', '611', 'Financial assets Net transactions in equity and investment fund shares', 'F000000', 'AFA0500', 'REVISED', '6042']
['2017.03', 'Rest of the world', '611', 'Financial assets Net transactions in equity and investment fund shares', 'F000000', 'AFA0500', 'FINAL', '5738']
['2008.03', 'Rest of the world', '611', 'Financial assets Net transactions in insurance, pension, and standardised guarantee schemes', 'F000000', 'AFA0600', 'FINAL', '0']
['2009.03', 'Rest of the world', '611', 'Financial assets Net transactions in insurance, pension, and standardised guarantee schemes', 'F000000', 'AFA0600', 'FINAL', '0']
['2010.03', 'Rest of the world', '611', 'Financial assets Net transactions in insurance, pension, and standardised guarantee schemes', 'F000000', 'AFA0600', 'FINAL', '0']
['2011.03', 'Rest of the world', '611', 'Financial assets Net transactions in insurance, pension, and standardised guarantee schemes', 'F000000', 'AFA0600', 'FINAL', '0']
['2012.0

['2016.03', 'Non-corporate business enterprises', '121', 'Financial liabilities Closing balance equity and investment fund shares', 'LE00000', 'AFL0500', 'REVISED', '312518']
['2017.03', 'Non-corporate business enterprises', '121', 'Financial liabilities Closing balance equity and investment fund shares', 'LE00000', 'AFL0500', 'FINAL', '359125']
['2008.03', 'Non-corporate business enterprises', '121', 'Financial liabilities Closing balance insurance, pension, and standardised guarantee schemes', 'LE00000', 'AFL0600', 'FINAL', '0']
['2009.03', 'Non-corporate business enterprises', '121', 'Financial liabilities Closing balance insurance, pension, and standardised guarantee schemes', 'LE00000', 'AFL0600', 'FINAL', '0']
['2010.03', 'Non-corporate business enterprises', '121', 'Financial liabilities Closing balance insurance, pension, and standardised guarantee schemes', 'LE00000', 'AFL0600', 'FINAL', '0']
['2011.03', 'Non-corporate business enterprises', '121', 'Financial liabilities Closi

['2008.03', 'Registered banks', '221', 'Financial liabilities Opening balance equity and investment fund shares', 'LS00000', 'AFL0500', 'REVISED', '25604']
['2009.03', 'Registered banks', '221', 'Financial liabilities Opening balance equity and investment fund shares', 'LS00000', 'AFL0500', 'REVISED', '14558']
['2010.03', 'Registered banks', '221', 'Financial liabilities Opening balance equity and investment fund shares', 'LS00000', 'AFL0500', 'REVISED', '9594']
['2011.03', 'Registered banks', '221', 'Financial liabilities Opening balance equity and investment fund shares', 'LS00000', 'AFL0500', 'REVISED', '12119']
['2012.03', 'Registered banks', '221', 'Financial liabilities Opening balance equity and investment fund shares', 'LS00000', 'AFL0500', 'REVISED', '17343']
['2013.03', 'Registered banks', '221', 'Financial liabilities Opening balance equity and investment fund shares', 'LS00000', 'AFL0500', 'REVISED', '20220']
['2014.03', 'Registered banks', '221', 'Financial liabilities Ope

['2014.03', 'Other depository institutions', '222', 'Revaluation Account Financial assets Financial derivatives and employee stock options', 'K070000', 'AFA0700', 'FINAL', '0']
['2015.03', 'Other depository institutions', '222', 'Revaluation Account Financial assets Financial derivatives and employee stock options', 'K070000', 'AFA0700', 'FINAL', '0']
['2016.03', 'Other depository institutions', '222', 'Revaluation Account Financial assets Financial derivatives and employee stock options', 'K070000', 'AFA0700', 'FINAL', '0']
['2017.03', 'Other depository institutions', '222', 'Revaluation Account Financial assets Financial derivatives and employee stock options', 'K070000', 'AFA0700', 'FINAL', '0']
['2008.03', 'Other depository institutions', '222', 'Revaluation Account Financial assets Other accounts receivable', 'K070000', 'AFA0800', 'FINAL', '0']
['2009.03', 'Other depository institutions', '222', 'Revaluation Account Financial assets Other accounts receivable', 'K070000', 'AFA0800'

['2010.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2011.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2012.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2013.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2014.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2015.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2016.03', 'Investment funds', '231', 'Revaluation Account Financial liabilities Debt securities', 'K070000', 'AFL0300', 'FINAL', '0']
['2017.03', 'Investment funds', '231', 'Revaluat

['2017.03', 'Other financial intermediaries excluding insurance and pension funds', '241', 'Financial liabilities Closing balance other accounts payable', 'LE00000', 'AFL0800', 'FINAL', '579']
['2008.03', 'Other financial intermediaries excluding insurance and pension funds', '241', 'Financial liabilities Closing balance Total financial liabilities', 'LE00000', 'AFL0000', 'REVISED', '93218']
['2009.03', 'Other financial intermediaries excluding insurance and pension funds', '241', 'Financial liabilities Closing balance Total financial liabilities', 'LE00000', 'AFL0000', 'REVISED', '82343']
['2010.03', 'Other financial intermediaries excluding insurance and pension funds', '241', 'Financial liabilities Closing balance Total financial liabilities', 'LE00000', 'AFL0000', 'REVISED', '84943']
['2011.03', 'Other financial intermediaries excluding insurance and pension funds', '241', 'Financial liabilities Closing balance Total financial liabilities', 'LE00000', 'AFL0000', 'REVISED', '78859']

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)



In [169]:
with open('C:/Users/TejYadav/Desktop/Tests/annual-balance-sheets-200817.csv') as f:
    lines = list(csv.reader(f))

In [170]:
header, values = lines[0], lines[1:]

In [172]:
data_dict = {h: v for h, v in zip (header, zip(*values))}

In [173]:
data_dict

{'ï»¿Year': ('2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
  '2014.03',
  '2015.03',
  '2016.03',
  '2017.03',
  '2008.03',
  '2009.03',
  '2010.03',
  '2011.03',
  '2012.03',
  '2013.03',
 

In [175]:
class my_dialect(csv.Dialect):
    lineterminator = '\n'
    delimiter = ';'
    quotechar = '"'
    quoting = csv.QUOTE_MINIMAL

In [176]:
reader = csv.reader(f, dialect=my_dialect)

TypeError: argument 1 must be an iterator

In [185]:
#JSON Data

obj = """
{"name": "Wes",
"places_lived": ["United States", "Spain", "Germany"],
"pet": null,
"siblings": [("name": "Scott", "age": 30, "pets": ["Zeus", "Zuko"]),
            "name": "Katie", "age": 38,
            "pets": ["Sixes", "Stache", "Cisco"]}]
}
"""

In [186]:
import json

In [189]:
result = json.loads(obj)

JSONDecodeError: Expecting value: line 5 column 14 (char 98)

In [188]:
asjson = json.dumps(result)

TypeError: Object of type 'DataFrame' is not JSON serializable

In [190]:
result

Unnamed: 0,Year,Institutional_sector_name,Institutional_sector_code,Descriptor,SNA08TRANS,Asset_liability_code,Status,Values
0,2008.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,225544
1,2009.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,243315
2,2010.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,259381
3,2011.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,262596
4,2012.03,Corporate business enterprises,141,Capital Account Opening balances Produced non-...,LS00000,AN10000,REVISED,267100
...,...,...,...,...,...,...,...,...
18715,2013.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,FINAL,53768
18716,2014.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,REVISED,58559
18717,2015.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,REVISED,70099
18718,2016.03,Pension funds,261,Financial liabilities Closing balance Total fi...,LE00000,AFL0000,REVISED,76021


In [191]:
asjson = json.dumps(result)

TypeError: Object of type 'DataFrame' is not JSON serializable

In [192]:
siblings = pd.DataFrame(result['siblings'], columns['name', 'age'])

KeyError: 'siblings'