In [157]:
# Dependencies
import numpy as np
import pandas as pd
import datetime as dt

# Python SQL toolkit and Object Relational Mapper
import sqlalchemy
from sqlalchemy.ext.automap import automap_base
from sqlalchemy.orm import Session
from sqlalchemy import create_engine, func

In [158]:
# create engine
#engine = create_engine("sqlite:///covid.sqlite")
engine = create_engine("sqlite:///database/covid.sqlite")

# reflect an existing database into a new model
Base = automap_base()
# reflect the tables
Base.prepare(engine, reflect=True)


In [159]:
# Save references to the table
Covid = Base.classes.owid_covid_data

In [160]:
# Create our session (link) from Python to the DB
session = Session(engine)

In [161]:
# 1. Import the sqlalchemy extract function.
from sqlalchemy import extract

# 2. Write a query that filters the Measurement table to retrieve the 'USA' total_cases. 
#results = session.query(Owid.date, Owid.iso_code, Owid.total_cases).filter(Owid.iso_code == 'USA').all()
results = session.query(Covid.date, Covid.total_cases).filter(Covid.iso_code == 'USA').all()
results

[('2020-01-22', 1.0),
 ('2020-01-23', 1.0),
 ('2020-01-24', 2.0),
 ('2020-01-25', 2.0),
 ('2020-01-26', 5.0),
 ('2020-01-27', 5.0),
 ('2020-01-28', 5.0),
 ('2020-01-29', 6.0),
 ('2020-01-30', 6.0),
 ('2020-01-31', 8.0),
 ('2020-02-01', 8.0),
 ('2020-02-02', 8.0),
 ('2020-02-03', 11.0),
 ('2020-02-04', 11.0),
 ('2020-02-05', 11.0),
 ('2020-02-06', 12.0),
 ('2020-02-07', 12.0),
 ('2020-02-08', 12.0),
 ('2020-02-09', 12.0),
 ('2020-02-10', 12.0),
 ('2020-02-11', 13.0),
 ('2020-02-12', 13.0),
 ('2020-02-13', 14.0),
 ('2020-02-14', 14.0),
 ('2020-02-15', 14.0),
 ('2020-02-16', 14.0),
 ('2020-02-17', 14.0),
 ('2020-02-18', 14.0),
 ('2020-02-19', 14.0),
 ('2020-02-20', 14.0),
 ('2020-02-21', 16.0),
 ('2020-02-22', 16.0),
 ('2020-02-23', 16.0),
 ('2020-02-24', 16.0),
 ('2020-02-25', 16.0),
 ('2020-02-26', 16.0),
 ('2020-02-27', 17.0),
 ('2020-02-28', 17.0),
 ('2020-02-29', 25.0),
 ('2020-03-01', 32.0),
 ('2020-03-02', 55.0),
 ('2020-03-03', 74.0),
 ('2020-03-04', 107.0),
 ('2020-03-05', 184.0)

In [162]:
#  3. Convert the 'USA' total_cases to a list.
usa_total_cases_list = [result for result in results]

In [163]:
usa_total_cases_list

[('2020-01-22', 1.0),
 ('2020-01-23', 1.0),
 ('2020-01-24', 2.0),
 ('2020-01-25', 2.0),
 ('2020-01-26', 5.0),
 ('2020-01-27', 5.0),
 ('2020-01-28', 5.0),
 ('2020-01-29', 6.0),
 ('2020-01-30', 6.0),
 ('2020-01-31', 8.0),
 ('2020-02-01', 8.0),
 ('2020-02-02', 8.0),
 ('2020-02-03', 11.0),
 ('2020-02-04', 11.0),
 ('2020-02-05', 11.0),
 ('2020-02-06', 12.0),
 ('2020-02-07', 12.0),
 ('2020-02-08', 12.0),
 ('2020-02-09', 12.0),
 ('2020-02-10', 12.0),
 ('2020-02-11', 13.0),
 ('2020-02-12', 13.0),
 ('2020-02-13', 14.0),
 ('2020-02-14', 14.0),
 ('2020-02-15', 14.0),
 ('2020-02-16', 14.0),
 ('2020-02-17', 14.0),
 ('2020-02-18', 14.0),
 ('2020-02-19', 14.0),
 ('2020-02-20', 14.0),
 ('2020-02-21', 16.0),
 ('2020-02-22', 16.0),
 ('2020-02-23', 16.0),
 ('2020-02-24', 16.0),
 ('2020-02-25', 16.0),
 ('2020-02-26', 16.0),
 ('2020-02-27', 17.0),
 ('2020-02-28', 17.0),
 ('2020-02-29', 25.0),
 ('2020-03-01', 32.0),
 ('2020-03-02', 55.0),
 ('2020-03-03', 74.0),
 ('2020-03-04', 107.0),
 ('2020-03-05', 184.0)

In [164]:
# 4. Create a DataFrame from the list of 'USA' total_cases. 
df = pd.DataFrame(usa_total_cases_list, columns=['Date', 'Total USA Cases'])
df

Unnamed: 0,Date,Total USA Cases
0,2020-01-22,1.0
1,2020-01-23,1.0
2,2020-01-24,2.0
3,2020-01-25,2.0
4,2020-01-26,5.0
...,...,...
325,2020-12-12,16143219.0
326,2020-12-13,16334361.0
327,2020-12-14,16527207.0
328,2020-12-15,16725973.0


In [165]:
results_table = session.query(Covid).filter().all()

In [166]:
list = [res_table for res_table in results_table]
list

[<sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bcc9f60>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bcc9fd0>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3080>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe30f0>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3160>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe31d0>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3240>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe32b0>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3320>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe33c8>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3470>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3518>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe35c0>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3668>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe3710>,
 <sqlalchemy.ext.automap.owid_covid_data at 0x7fa37bfe37b8>,
 <sqlalchemy.ext.automap

In [167]:
df = pd.DataFrame(list)
df

Unnamed: 0,0
0,<sqlalchemy.ext.automap.owid_covid_data object...
1,<sqlalchemy.ext.automap.owid_covid_data object...
2,<sqlalchemy.ext.automap.owid_covid_data object...
3,<sqlalchemy.ext.automap.owid_covid_data object...
4,<sqlalchemy.ext.automap.owid_covid_data object...
...,...
54551,<sqlalchemy.ext.automap.owid_covid_data object...
54552,<sqlalchemy.ext.automap.owid_covid_data object...
54553,<sqlalchemy.ext.automap.owid_covid_data object...
54554,<sqlalchemy.ext.automap.owid_covid_data object...


In [168]:
for m in session.query(*Covid.__table__.columns).all():
    print (m)

('AFG', 'Asia', 'Afghanistan', '2020-02-24', 1.0, None, None, None, None, None, 0.026, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 8.33, 38928341.0, 54.422, 18.6, 2.581, 1.337, 1803.987, None, 597.029, 9.59, None, None, 37.746, 0.5, 64.83, 0.498, 1)
('AFG', 'Asia', 'Afghanistan', '2020-02-25', 1.0, '0.0', None, None, None, None, 0.026, '0.0', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 8.33, 38928341.0, 54.422, 18.6, 2.581, 1.337, 1803.987, None, 597.029, 9.59, None, None, 37.746, 0.5, 64.83, 0.498, 2)
('AFG', 'Asia', 'Afghanistan', '2020-02-26', 1.0, '0.0', None, None, None, None, 0.026, '0.0', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 8.33, 38928341.0, 54.422, 18.6, 2.581, 1.337, 1

('ARG', 'South America', 'Argentina', '2020-04-18', 2758.0, '89.0', '111.857', '129.0', '6.0', '6.571', 61.023, '1.969', '2.475', '2.854', '0.133', '0.145', '1.25', None, None, None, None, None, None, None, None, '1640.0', '30159.0', '0.667', '0.036', '1562.0', '0.035', '0.072', '14.0', 'people tested', None, None, 100.0, 45195777.0, 16.177, 31.9, 11.198, 7.441, 18933.907, '0.6', 191.032, 5.5, '16.2', '27.7', None, 5.0, 76.67, 0.825, 1794)
('ARG', 'South America', 'Argentina', '2020-04-19', 2839.0, '81.0', '99.571', '132.0', '3.0', '6.0', 62.816, '1.792', '2.203', '2.921', '0.066', '0.133', '1.25', None, None, None, None, None, None, None, None, '1182.0', '31341.0', '0.693', '0.026', '1579.0', '0.035', '0.063', '15.9', 'people tested', None, None, 100.0, 45195777.0, 16.177, 31.9, 11.198, 7.441, 18933.907, '0.6', 191.032, 5.5, '16.2', '27.7', None, 5.0, 76.67, 0.825, 1795)
('ARG', 'South America', 'Argentina', '2020-04-20', 2941.0, '102.0', '104.714', '136.0', '4.0', '5.571', 65.072, '2

('BHR', 'Asia', 'Bahrain', '2020-11-27', 86515.0, '168.0', '149.714', '341.0', '0.0', '0.429', 50843.832, '98.732', '87.985', '200.402', '0.0', '0.252', '0.91', None, None, None, None, None, None, None, None, '12388.0', '2015598.0', '1184.543', '7.28', '10078.0', '5.923', '0.015', '67.3', 'units unclear', None, None, 58.33, 1701583.0, 1935.907, 32.4, 2.372, 1.387, 43290.705, None, 151.689, 16.52, '5.8', '37.6', None, 2.0, 77.29, 0.846, 3794)
('BHR', 'Asia', 'Bahrain', '2020-11-28', 86645.0, '130.0', '150.571', '341.0', '0.0', '0.429', 50920.231, '76.399', '88.489', '200.402', '0.0', '0.252', '0.91', None, None, None, None, None, None, None, None, '10176.0', '2025774.0', '1190.523', '5.98', '10177.0', '5.981', '0.015', '67.6', 'units unclear', None, None, 58.33, 1701583.0, 1935.907, 32.4, 2.372, 1.387, 43290.705, None, 151.689, 16.52, '5.8', '37.6', None, 2.0, 77.29, 0.846, 3795)
('BHR', 'Asia', 'Bahrain', '2020-11-29', 86787.0, '142.0', '154.571', '341.0', '0.0', '0.429', 51003.683, '8

('BEN', 'Africa', 'Benin', '2020-04-19', 35.0, '0.0', '0.0', '1.0', '0.0', '0.0', 2.887, '0.0', '0.0', '0.082', '0.0', '0.0', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 70.83, 12123198.0, 99.11, 18.8, 3.244, 1.942, 2064.236, '49.6', 235.848, 0.99, '0.6', '12.3', 11.035, 0.5, 61.77, 0.515, 5293)
('BEN', 'Africa', 'Benin', '2020-04-20', 54.0, '19.0', '2.714', '1.0', '0.0', '0.0', 4.454, '1.567', '0.224', '0.082', '0.0', '0.0', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 70.83, 12123198.0, 99.11, 18.8, 3.244, 1.942, 2064.236, '49.6', 235.848, 0.99, '0.6', '12.3', 11.035, 0.5, 61.77, 0.515, 5294)
('BEN', 'Africa', 'Benin', '2020-04-21', 54.0, '0.0', '2.714', '1.0', '0.0', '0.0', 4.454, '0.0', '0.224', '0.082', '0.0', '0.0', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, Non

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)




('KEN', 'Africa', 'Kenya', '2020-06-20', 4478.0, '104.0', '145.857', '121.0', '2.0', '3.0', 83.279, '1.934', '2.713', '2.25', '0.037', '0.056', '1.21', None, None, None, None, None, None, None, None, '2820.0', '136361.0', '2.536', '0.052', '3456.0', '0.064', '0.042', '23.7', 'samples tested', None, None, 88.89, 53771300.0, 87.324, 20.0, 2.686, 1.528, 2993.028, '36.8', 218.637, 2.92, '1.2', '20.4', 24.651, 1.4, 66.7, 0.59, 25788)
('KEN', 'Africa', 'Kenya', '2020-06-21', 4738.0, '260.0', '163.429', '123.0', '2.0', '2.857', 88.114, '4.835', '3.039', '2.287', '0.037', '0.053', '1.22', None, None, None, None, None, None, None, None, '3651.0', '140012.0', '2.604', '0.068', '3525.0', '0.066', '0.046', '21.6', 'samples tested', None, None, 88.89, 53771300.0, 87.324, 20.0, 2.686, 1.528, 2993.028, '36.8', 218.637, 2.92, '1.2', '20.4', 24.651, 1.4, 66.7, 0.59, 25789)
('KEN', 'Africa', 'Kenya', '2020-06-22', 4797.0, '59.0', '152.857', '125.0', '2.0', '3.0', 89.211, '1.097', '2.843', '2.325', '0.0

('LSO', 'Africa', 'Lesotho', '2020-08-26', 1051.0, '2.0', '15.0', '31.0', '1.0', '0.143', 490.605, '0.934', '7.002', '14.471', '0.467', '0.067', '0.9', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 71.3, 2142252.0, 73.562, 22.2, 4.506, 2.647, 2851.153, '59.6', 405.126, 3.94, '0.4', '53.9', 2.117, None, 54.33, 0.52, 27786)
('LSO', 'Africa', 'Lesotho', '2020-08-27', 1051.0, '0.0', '7.857', '31.0', '0.0', '0.143', 490.605, '0.0', '3.668', '14.471', '0.0', '0.067', '0.9', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 71.3, 2142252.0, 73.562, 22.2, 4.506, 2.647, 2851.153, '59.6', 405.126, 3.94, '0.4', '53.9', 2.117, None, 54.33, 0.52, 27787)
('LSO', 'Africa', 'Lesotho', '2020-08-28', 1051.0, '0.0', '5.143', '31.0', '0.0', '0.143', 490.605, '0.0', '2.401', '14.471', '0.0', '0.067', '0.9', None, None, None, None, None, None, None, None, None, None, None, None

('MDG', 'Africa', 'Madagascar', '2020-08-17', 13886.0, '59.0', '97.714', '171.0', '1.0', '2.857', 501.462, '2.131', '3.529', '6.175', '0.036', '0.103', '0.72', None, None, None, None, None, None, None, None, '336.0', '52657.0', '1.902', '0.012', '490.0', '0.018', '0.199', '5.0', 'tests performed', None, None, 65.74, 27691019.0, 43.951, 19.6, 2.929, 1.686, 1416.44, '77.6', 405.994, 3.94, None, None, 50.54, 0.2, 67.04, 0.519, 29492)
('MDG', 'Africa', 'Madagascar', '2020-08-18', 14009.0, '123.0', '98.857', '173.0', '2.0', '3.0', 505.904, '4.442', '3.57', '6.248', '0.072', '0.108', '0.72', None, None, None, None, None, None, None, None, '621.0', '53278.0', '1.924', '0.022', '505.0', '0.018', '0.196', '5.1', 'tests performed', None, None, 65.74, 27691019.0, 43.951, 19.6, 2.929, 1.686, 1416.44, '77.6', 405.994, 3.94, None, None, 50.54, 0.2, 67.04, 0.519, 29493)
('MDG', 'Africa', 'Madagascar', '2020-08-19', 14074.0, '65.0', '96.714', '173.0', '0.0', '2.429', 508.251, '2.347', '3.493', '6.248'

IOPub data rate exceeded.
The notebook server will temporarily stop sending output
to the client in order to avoid crashing it.
To change this limit, set the config variable
`--NotebookApp.iopub_data_rate_limit`.

Current values:
NotebookApp.iopub_data_rate_limit=1000000.0 (bytes/sec)
NotebookApp.rate_limit_window=3.0 (secs)




('UZB', 'Asia', 'Uzbekistan', '2020-11-03', 67553.0, '299.0', '238.857', '574.0', '3.0', '2.571', 2018.363, '8.934', '7.137', '17.15', '0.09', '0.077', '0.89', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 39.81, 33469199.0, 76.134, 28.2, 4.469, 2.873, 6253.104, None, 724.417, 7.57, '1.3', '24.7', None, 4.0, 71.72, 0.71, 52456)
('UZB', 'Asia', 'Uzbekistan', '2020-11-04', 67779.0, '226.0', '234.0', '577.0', '3.0', '2.714', 2025.116, '6.752', '6.992', '17.24', '0.09', '0.081', '0.89', None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, None, 39.81, 33469199.0, 76.134, 28.2, 4.469, 2.873, 6253.104, None, 724.417, 7.57, '1.3', '24.7', None, 4.0, 71.72, 0.71, 52457)
('UZB', 'Asia', 'Uzbekistan', '2020-11-05', 68009.0, '230.0', '231.0', '579.0', '2.0', '2.571', 2031.988, '6.872', '6.902', '17.299', '0.06', '0.077', '0.9', None, None, None, None, None, None, None, None,

('ZMB', 'Africa', 'Zambia', '2020-12-11', 18161.0, '70.0', '43.429', '365.0', '1.0', '0.143', 987.872, '3.808', '2.362', '19.854', '0.054', '0.008', None, None, None, None, None, None, None, None, None, '3755.0', '471542.0', '25.65', '0.204', '5841.0', '0.318', '0.007', '134.5', 'tests performed', None, None, 45.37, 18383956.0, 22.995, 17.7, 2.48, 1.542, 3689.251, '57.5', 234.499, 3.94, '3.1', '24.7', 13.938, 2.0, 63.89, 0.588, 54279)
('ZMB', 'Africa', 'Zambia', '2020-12-12', 18217.0, '56.0', '45.571', '366.0', '1.0', '0.286', 990.918, '3.046', '2.479', '19.909', '0.054', '0.016', None, None, None, None, None, None, None, None, None, '5632.0', '477174.0', '25.956', '0.306', '5807.0', '0.316', '0.008', '127.4', 'tests performed', None, None, 45.37, 18383956.0, 22.995, 17.7, 2.48, 1.542, 3689.251, '57.5', 234.499, 3.94, '3.1', '24.7', 13.938, 2.0, 63.89, 0.588, 54280)
('ZMB', 'Africa', 'Zambia', '2020-12-13', 18274.0, '57.0', '51.143', '367.0', '1.0', '0.429', 994.019, '3.101', '2.782', 

In [169]:
list = [res_table for res_table in session.query(*Covid.__table__.columns).all()]
list

[('AFG',
  'Asia',
  'Afghanistan',
  '2020-02-24',
  1.0,
  None,
  None,
  None,
  None,
  None,
  0.026,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  8.33,
  38928341.0,
  54.422,
  18.6,
  2.581,
  1.337,
  1803.987,
  None,
  597.029,
  9.59,
  None,
  None,
  37.746,
  0.5,
  64.83,
  0.498,
  1),
 ('AFG',
  'Asia',
  'Afghanistan',
  '2020-02-25',
  1.0,
  '0.0',
  None,
  None,
  None,
  None,
  0.026,
  '0.0',
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  None,
  8.33,
  38928341.0,
  54.422,
  18.6,
  2.581,
  1.337,
  1803.987,
  None,
  597.029,
  9.59,
  None,
  None,
  37.746,
  0.5,
  64.83,
  0.498,
  2),
 ('AFG',
  'Asia',
  'Afghanistan',
  '2020-02-26',
  1.0,
  '0.0',
  None

In [170]:
df = pd.DataFrame(list)
df

Unnamed: 0,iso_code,continent,location,date,total_cases,new_cases,new_cases_smoothed,total_deaths,new_deaths,new_deaths_smoothed,...,extreme_poverty,cardiovasc_death_rate,diabetes_prevalence,female_smokers,male_smokers,handwashing_facilities,hospital_beds_per_thousand,life_expectancy,human_development_index,id
0,AFG,Asia,Afghanistan,2020-02-24,1.0,,,,,,...,,597.029,9.59,,,37.746,0.5,64.83,0.498,1
1,AFG,Asia,Afghanistan,2020-02-25,1.0,0.0,,,,,...,,597.029,9.59,,,37.746,0.5,64.83,0.498,2
2,AFG,Asia,Afghanistan,2020-02-26,1.0,0.0,,,,,...,,597.029,9.59,,,37.746,0.5,64.83,0.498,3
3,AFG,Asia,Afghanistan,2020-02-27,1.0,0.0,,,,,...,,597.029,9.59,,,37.746,0.5,64.83,0.498,4
4,AFG,Asia,Afghanistan,2020-02-28,1.0,0.0,,,,,...,,597.029,9.59,,,37.746,0.5,64.83,0.498,5
...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...,...
54551,ZWE,Africa,Zimbabwe,2020-12-12,11219.0,57.0,86.0,307.0,1.0,2.286,...,21.4,307.846,1.82,1.6,30.7,36.791,1.7,61.49,0.535,54552
54552,ZWE,Africa,Zimbabwe,2020-12-13,11246.0,27.0,75.429,307.0,0.0,2.286,...,21.4,307.846,1.82,1.6,30.7,36.791,1.7,61.49,0.535,54553
54553,ZWE,Africa,Zimbabwe,2020-12-14,11358.0,112.0,74.143,309.0,2.0,2.143,...,21.4,307.846,1.82,1.6,30.7,36.791,1.7,61.49,0.535,54554
54554,ZWE,Africa,Zimbabwe,2020-12-15,11522.0,164.0,87.143,310.0,1.0,1.0,...,21.4,307.846,1.82,1.6,30.7,36.791,1.7,61.49,0.535,54555


In [171]:
df.dtypes

iso_code                               object
continent                              object
location                               object
date                                   object
total_cases                           float64
new_cases                              object
new_cases_smoothed                     object
total_deaths                           object
new_deaths                             object
new_deaths_smoothed                    object
total_cases_per_million               float64
new_cases_per_million                  object
new_cases_smoothed_per_million         object
total_deaths_per_million               object
new_deaths_per_million                 object
new_deaths_smoothed_per_million        object
reproduction_rate                      object
icu_patients                           object
icu_patients_per_million               object
hosp_patients                          object
hosp_patients_per_million              object
weekly_icu_admissions             

In [172]:
df['new_cases'] = pd.to_numeric(df['new_cases'])

In [173]:
df.dtypes


iso_code                               object
continent                              object
location                               object
date                                   object
total_cases                           float64
new_cases                             float64
new_cases_smoothed                     object
total_deaths                           object
new_deaths                             object
new_deaths_smoothed                    object
total_cases_per_million               float64
new_cases_per_million                  object
new_cases_smoothed_per_million         object
total_deaths_per_million               object
new_deaths_per_million                 object
new_deaths_smoothed_per_million        object
reproduction_rate                      object
icu_patients                           object
icu_patients_per_million               object
hosp_patients                          object
hosp_patients_per_million              object
weekly_icu_admissions             

In [174]:
#df = df.astype({'new_cases': 'float64', 'weekly_icu_admissions':'float64', 'weekly_icu_admissions_per_million':'float64','weekly_hosp_admissions':'float64', 'weekly_hosp_admissions_per_million':'float64', 'new_test':'float64', 'total_tests':'float64','total_tests_per_thousand':'float64','new_tests_per_thousand':'float64','new_tests_smoothed':'float64','new_tests_smoothed_per_thousand':'float64' ,'positive_rate':'float64', 'tests_per_case':'float64','tests_units':'float64', 'total_vaccinations':'float64', 'total_vaccinations_per_hundred':'float64', 'extreme_poverty':'float64', 'female_smoakers':'float64'','weekly_icu_admissions_per_million':'float64','weekly_hosp_admissions':'float64', 'weekly_hosp_admissions_per_million':'float64', 'new_test':'float64', 'total_tests':'float64','total_tests_per_thousand':'float64','new_tests_per_thousand':'float64','new_tests_smoothed':'float64','new_tests_smoothed_per_thousand':'float64' ,'positive_rate':'float64', 'tests_per_case':'float64','tests_units':'float64', 'total_vaccinations':'float64', 'total_vaccinations_per_hundred':'float64', 'extreme_poverty':'float64', 'female_smoakers':'float64', 'male_smokers':'float64'})

In [175]:
lists = [col for col in df.columns]
lists

['iso_code',
 'continent',
 'location',
 'date',
 'total_cases',
 'new_cases',
 'new_cases_smoothed',
 'total_deaths',
 'new_deaths',
 'new_deaths_smoothed',
 'total_cases_per_million',
 'new_cases_per_million',
 'new_cases_smoothed_per_million',
 'total_deaths_per_million',
 'new_deaths_per_million',
 'new_deaths_smoothed_per_million',
 'reproduction_rate',
 'icu_patients',
 'icu_patients_per_million',
 'hosp_patients',
 'hosp_patients_per_million',
 'weekly_icu_admissions',
 'weekly_icu_admissions_per_million',
 'weekly_hosp_admissions',
 'weekly_hosp_admissions_per_million',
 'new_tests',
 'total_tests',
 'total_tests_per_thousand',
 'new_tests_per_thousand',
 'new_tests_smoothed',
 'new_tests_smoothed_per_thousand',
 'positive_rate',
 'tests_per_case',
 'tests_units',
 'total_vaccinations',
 'total_vaccinations_per_hundred',
 'stringency_index',
 'population',
 'population_density',
 'median_age',
 'aged_65_older',
 'aged_70_older',
 'gdp_per_capita',
 'extreme_poverty',
 'cardiova