In [1]:
import os
import pandas as pd
from pandas import Series, DataFrame
import country_converter as coco

In [2]:
# https://data.nber.org/data-appendix/w15319/
# https://data.nber.org/data-appendix/w15319/FinalCHAT_72909.csv
# https://www.nber.org/system/files/working_papers/w15319/w15319.pdf


In [3]:
os.chdir('/Users/ariana/desktop/historical_tech')

In [4]:
chat = pd.read_csv('raw data/FinalCHAT_72909.csv')
chat

  chat = pd.read_csv('raw data/FinalCHAT_72909.csv')


Unnamed: 0,country_name,year,ag_harvester,ag_milkingmachine,ag_tractor,atm,aviationpkm,aviationtkm,bed_acute,bed_hosp,...,vehicle_com,visitorbeds,visitorrooms,xlpopulation,xlrealgdp,pctivprimeenroll,pctivsecenroll,pctivprivateinv,pctivpublicinv,pctivliteracy
0,Afghanistan,1750,,,,,,,,,...,,,,,,,,,,
1,Afghanistan,1751,,,,,,,,,...,,,,,,,,,,
2,Afghanistan,1752,,,,,,,,,...,,,,,,,,,,
3,Afghanistan,1753,,,,,,,,,...,,,,,,,,,,
4,Afghanistan,1754,,,,,,,,,...,,,,,,,,,,
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
41694,Zimbabwe,2004,,,,,,,,,...,,,,,,,,,,
41695,Zimbabwe,2005,,,,,,,,,...,,,,,,,,,,
41696,Zimbabwe,2006,,,,,,,,,...,,,,,,,,,,
41697,Zimbabwe,2007,,,,,,,,,...,,,,,,,,,,


In [5]:
chat_dict = pd.read_excel('raw data/chat_dictionary.xlsx', skipfooter=2)
chat_dict

Unnamed: 0,VARIABLE NAME,DEFINITION,SOURCE
0,ag_harvester,Number of self‐propelled machines that reap an...,FAOSTAT (2004)
1,ag_milkingmachine,Number of installations consisting of several ...,FAOSTAT (2004)
2,ag_tractor,Number of wheel and crawler tractors (excludin...,FAOSTAT (2004)
3,atm,Number of electromechanical devices that permi...,BIS (various years) and ECB (various years)
4,aviationpkm,Civil aviation passenger‐KM traveled on schedu...,Mitchell (1998)
...,...,...,...
106,pctivprimeenroll,Primary school enrollment rate,Mitchell and Banks
107,pctivsecenroll,Secondary school enrollment rate,Mitchell and Banks
108,pctivprivateinv,Private investment as a share of GDP,Penn World Table (2007)
109,pctivpublicinv,Public investment as a share of GDP,Penn World Table (2007)


In [6]:
var_names = list(chat.columns[2:])
var_names

['ag_harvester',
 'ag_milkingmachine',
 'ag_tractor',
 'atm',
 'aviationpkm',
 'aviationtkm',
 'bed_acute',
 'bed_hosp',
 'bed_longterm',
 'cabletv',
 'cellphone',
 'cheque',
 'computer',
 'creditdebit',
 'eft',
 'elecprod',
 'fert_total',
 'internetuser',
 'irrigatedarea',
 'kidney_dialpat',
 'kidney_homedialpat',
 'loom_auto',
 'loom_total',
 'mail',
 'med_catscanner',
 'med_lithotriptor',
 'med_mammograph',
 'med_mriunit',
 'med_radiationequip',
 'newspaper',
 'pctdaysurg_cataract',
 'pctdaysurg_cholecyst',
 'pctdaysurg_hernia',
 'pctdaysurg_lapcholecyst',
 'pctdaysurg_tonsil',
 'pctdaysurg_varicosevein',
 'pcthomedialysis',
 'pctimmunizdpt',
 'pctimmunizmeas',
 'pctirrigated',
 'pctmvbyarea',
 'pest_total',
 'pos',
 'radio',
 'railline',
 'railp',
 'railpkm',
 'railt',
 'railtkm',
 'ship_all',
 'ship_motor',
 'ship_sail',
 'ship_steam',
 'ship_steammotor',
 'shipton_all',
 'shipton_motor',
 'shipton_sail',
 'shipton_steam',
 'shipton_steammotor',
 'spindle_mule',
 'spindle_ring',
 

In [7]:
def read_chat(col_num, tech_name, unit='Number in Use', metric='Cumulative total capacity'):
    chat = pd.read_csv('raw data/FinalCHAT_72909.csv', usecols=[0,1,col_num])
    chat.replace('Venezuala', 'Venezuela', inplace=True)
    country_list = list(set(chat['country_name']))
    chat_df = []
    for country in country_list:
        df = chat[chat['country_name']==country]
        df.set_index('year', drop=True, inplace=True)
        df = df.transpose()
        df['Country Name'] = country
        if country == 'North Vietnam':
            country_code = 'VD'
        elif country == 'South Vietnam':
            country_code = 'VN'
        else:
            country_code = coco.convert(names=country, to='iso2')
        df['Country Code'] = country_code
        df.drop(index='country_name', inplace=True)
        chat_df.append(df)
    chat_all = pd.concat(chat_df)
    chat_all['Data Source'] = 'NBER CHAT'
    chat_all['Spatial Scale'] = 'National'
    chat_all['Unit'] = unit
    chat_all['Metric'] = metric
    chat_all['Technology Name'] = tech_name
    chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']
    chat_all.set_index('ID', drop=True, inplace=True)
    chat_all.columns.name = None
    omit = []
    for col in chat_all.columns:
        if type(col) != int:
            omit.append(col)
    empty_rows = chat_all.drop(columns=omit)
    empty_rows.dropna(how='all', inplace=True)
    na_idx = []
    for country in chat_all.index:
        if country not in empty_rows.index:
            na_idx.append(country)
    chat_all.drop(na_idx, inplace=True)
    file_name = 'cleaned data/chat_' + tech_name + '.csv'
    chat_all.to_csv(file_name)
    return chat_all


In [8]:
ag_harvester = read_chat(2, 'Crop harvester', metric='Total Number')
ag_harvester

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Crop harvester_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_TD,,,,,,,,,,,...,,,,Chad,TD,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_BO,,,,,,,,,,,...,,,,Bolivia,BO,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_DE,,,,,,,,,,,...,,,,Germany,DE,NBER CHAT,National,Number in Use,Total Number,Crop harvester
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Crop harvester_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number in Use,Total Number,Crop harvester
Crop harvester_Total Number_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Number in Use,Total Number,Crop harvester


In [9]:
steam_ships = read_chat(54, 'Steam ships')
steam_ships

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Steam ships_Cumulative total capacity_DE,,,,,,,,,,,...,,,,Germany,DE,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_IE,,,,,,,,,,,...,,,,Ireland,IE,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_FR,,,,,,,,,,,...,,,,France,FR,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_FI,,,,,,,,,,,...,,,,Finland,FI,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_RU,,,,,,,,,,,...,,,,Russia,RU,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_AT,,,,,,,,,,,...,,,,Austria,AT,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_GR,,,,,,,,,,,...,,,,Greece,GR,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_DK,,,,,,,,,,,...,,,,Denmark,DK,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_MX,,,,,,,,,,,...,,,,Mexico,MX,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships
Steam ships_Cumulative total capacity_ES,,,,,,,,,,,...,,,,Spain,ES,NBER CHAT,National,Number in Use,Cumulative total capacity,Steam ships


In [10]:
telephones = read_chat(91, 'Telephones', metric='Total Number')
telephones

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Telephones_Total Number_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_TD,,,,,,,,,,,...,,,,Chad,TD,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Number in Use,Total Number,Telephones
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Telephones_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number in Use,Total Number,Telephones
Telephones_Total Number_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Number in Use,Total Number,Telephones


In [11]:
rail = read_chat(46, 'Railroad', unit='Length of railway open in kilometers',metric='Cumulative Length')
rail

  chat = pd.read_csv('raw data/FinalCHAT_72909.csv', usecols=[0,1,col_num])
  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Railroad_Cumulative Length_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_MU,,,,,,,,,,,...,,,,Mauritius,MU,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Railroad_Cumulative Length_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad
Railroad_Cumulative Length_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Length of railway open in kilometers,Cumulative Length,Railroad


In [12]:
tv = read_chat(97, 'Television', metric='Total Number')
tv

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Television_Total Number_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_TD,,,,,,,,,,,...,,,,Chad,TD,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Number in Use,Total Number,Television
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Television_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number in Use,Total Number,Television
Television_Total Number_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Number in Use,Total Number,Television


In [13]:
# Radio	CHAT database (radio)
radio = read_chat(45, 'Radio', metric='Total Number')
radio

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Radio_Total Number_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_TD,,,,,,,,,,,...,,,,Chad,TD,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Number in Use,Total Number,Radio
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Radio_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number in Use,Total Number,Radio
Radio_Total Number_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Number in Use,Total Number,Radio


In [14]:
# Passenger Cars	CHAT (vehicle_car)
cars = read_chat(102, 'Passenger Cars', metric='Total Number')
cars

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Passenger Cars_Total Number_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_TD,,,,,,,,,,,...,,,,Chad,TD,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Passenger Cars_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number in Use,Total Number,Passenger Cars
Passenger Cars_Total Number_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Number in Use,Total Number,Passenger Cars


In [15]:
# Telegraph Traffic	CHAT (telegram)

telegram = read_chat(90, 'Telegraph Traffic', 'Number of telegrams sent annually', 'Total Number')
telegram

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Telegraph Traffic_Total Number_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_DE,,,,,,,,,,,...,,,,Germany,DE,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_ZA,,,,,,,,,,,...,,,,South Africa,ZA,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Telegraph Traffic_Total Number_PH,,,,,,,,,,,...,,,,Philippines,PH,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_MW,,,,,,,,,,,...,,,,Malawi,MW,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic
Telegraph Traffic_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number of telegrams sent annually,Total Number,Telegraph Traffic


In [16]:
# Postal traffic	CHAT (mail)

mail = read_chat(25, 'Postal Traffic', 'Number of items mailed/received', metric='Total Number')
mail

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Postal Traffic_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_MU,,,,,,,,,,,...,,,,Mauritius,MU,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_DE,,,,,,,,,,,...,,,,Germany,DE,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_ZA,,,,,,,,,,,...,,,,South Africa,ZA,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Postal Traffic_Total Number_MW,,,,,,,,,,,...,,,,Malawi,MW,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic
Postal Traffic_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number of items mailed/received,Total Number,Postal Traffic


In [17]:
# Cellphones	CHAT (cellphone)

cells = read_chat(12, 'Cellphones', unit='Number of users', metric='Total Number')
cells

  chat_all['Data Source'] = 'NBER CHAT'
  chat_all['Spatial Scale'] = 'National'
  chat_all['Unit'] = unit
  chat_all['Metric'] = metric
  chat_all['Technology Name'] = tech_name
  chat_all['ID'] = chat_all['Technology Name'] + '_' + chat_all['Metric'] + '_' + chat_all['Country Code']


Unnamed: 0_level_0,1750,1751,1752,1753,1754,1755,1756,1757,1758,1759,...,2006,2007,2008,Country Name,Country Code,Data Source,Spatial Scale,Unit,Metric,Technology Name
ID,Unnamed: 1_level_1,Unnamed: 2_level_1,Unnamed: 3_level_1,Unnamed: 4_level_1,Unnamed: 5_level_1,Unnamed: 6_level_1,Unnamed: 7_level_1,Unnamed: 8_level_1,Unnamed: 9_level_1,Unnamed: 10_level_1,Unnamed: 11_level_1,Unnamed: 12_level_1,Unnamed: 13_level_1,Unnamed: 14_level_1,Unnamed: 15_level_1,Unnamed: 16_level_1,Unnamed: 17_level_1,Unnamed: 18_level_1,Unnamed: 19_level_1,Unnamed: 20_level_1,Unnamed: 21_level_1
Cellphones_Total Number_TG,,,,,,,,,,,...,,,,Togo,TG,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_BR,,,,,,,,,,,...,,,,Brazil,BR,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_TD,,,,,,,,,,,...,,,,Chad,TD,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_TZ,,,,,,,,,,,...,,,,Tanzania,TZ,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_SR,,,,,,,,,,,...,,,,Suriname,SR,NBER CHAT,National,Number of users,Total Number,Cellphones
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
Cellphones_Total Number_CA,,,,,,,,,,,...,,,,Canada,CA,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_RO,,,,,,,,,,,...,,,,Romania,RO,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_GB,,,,,,,,,,,...,,,,United Kingdom,GB,NBER CHAT,National,Number of users,Total Number,Cellphones
Cellphones_Total Number_ER,,,,,,,,,,,...,,,,Eritrea,ER,NBER CHAT,National,Number of users,Total Number,Cellphones


In [18]:
for var_def in chat_dict[chat_dict[chat_dict.columns[0]]=='telephone'][chat_dict.columns[1]]:
    print(var_def)

Number of mainline telephone lines connecting a customer's equipment to the public switched telephone network as of year end


In [19]:
for var_idx in chat_dict[chat_dict[chat_dict.columns[0]]=='ag_harvester'].index:
    print(var_idx)

0


In [20]:
chat_dict.iloc[89]

VARIABLE NAME                                             telephone
DEFINITION        Number of mainline telephone lines connecting ...
SOURCE                           Mitchell (1998), WORLD BANK (2007)
Name: 89, dtype: object