# Hands on!

In [155]:
import pandas as pd
import numpy as np


# Pandas Series

In [156]:
# Populations of the seven G7 members, in millions. No index is supplied here,
# so the Series starts out labelled 0..6; country labels are attached later.
g7_pop = pd.Series([35.467, 63.951, 80.940, 60.665, 127.061, 64.511, 318.523])

In [157]:
g7_pop

0     35.467
1     63.951
2     80.940
3     60.665
4    127.061
5     64.511
6    318.523
dtype: float64

In [158]:
g7_pop.name = 'G7 Population in millions'

In [159]:
g7_pop

0     35.467
1     63.951
2     80.940
3     60.665
4    127.061
5     64.511
6    318.523
Name: G7 Population in millions, dtype: float64

In [160]:
g7_pop.dtype

dtype('float64')

In [161]:
g7_pop.values

array([ 35.467,  63.951,  80.94 ,  60.665, 127.061,  64.511, 318.523])

In [162]:
type(g7_pop.values)

numpy.ndarray

In [163]:
g7_pop

0     35.467
1     63.951
2     80.940
3     60.665
4    127.061
5     64.511
6    318.523
Name: G7 Population in millions, dtype: float64

In [164]:
# At this point the index is still the default RangeIndex (0..6), so the
# integer labels coincide with positions and 0 selects the first element.
g7_pop[0]

35.467

In [165]:
g7_pop[1]

63.951

In [166]:
g7_pop.index

RangeIndex(start=0, stop=7, step=1)

In [167]:
# Plain Python list, used further down (l[:2]) to compare list slicing with
# label-based slicing on the Series.
l = ['a', 'b', 'c']

In [168]:
# Replace the 0..6 labels with country names, listed in the same order as the
# population values, so elements can be looked up by country.
g7_pop.index = [
    'Canada',
    'France',
    'Germany',
    'Italy',
    'Japan',
    'United Kingdom',
    'United States'
]

In [169]:
g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

In [170]:
# Same Series built in a single step: the dict keys become the index labels,
# the dict values become the data, and `name` sets the Series name.
pd.Series({
    'Canada' : 35.467,
    'France' : 63.951,
    'Germany' : 80.94,
    'Italy' : 60.665,
    'Japan' : 127.061,
    'United Kingdom' : 64.511,
    'United States' : 318.523
}, name='G7 Population in millions')

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

In [171]:
# Building a Series from an existing one with an explicit index aligns on
# labels: only the requested labels are kept, and a label that is missing from
# the source ('Spain') comes back as NaN.
pd.Series(g7_pop, index=['France', 'Germany', 'Italy', 'Spain'])

France     63.951
Germany    80.940
Italy      60.665
Spain         NaN
Name: G7 Population in millions, dtype: float64

# Indexing

In [172]:
g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

In [173]:
g7_pop['Canada']

35.467

In [174]:
g7_pop['Japan']

127.061

In [175]:
g7_pop.iloc[0]

35.467

In [176]:
g7_pop.iloc[-1]

318.523

In [177]:
g7_pop[['Italy', 'France']]

Italy     60.665
France    63.951
Name: G7 Population in millions, dtype: float64

In [178]:
g7_pop.iloc[[0, 1]]

Canada    35.467
France    63.951
Name: G7 Population in millions, dtype: float64

In [179]:
# Slicing by label includes the stop label: 'Italy' is part of the result.
g7_pop['Canada' : 'Italy']

Canada     35.467
France     63.951
Germany    80.940
Italy      60.665
Name: G7 Population in millions, dtype: float64

In [180]:
# A positional slice on a plain list excludes the stop position, so only the
# elements at positions 0 and 1 are returned.
l[:2]

['a', 'b']

# Conditional selection (boolean arrays)

In [181]:
g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

In [182]:
g7_pop > 70

Canada            False
France            False
Germany            True
Italy             False
Japan              True
United Kingdom    False
United States      True
Name: G7 Population in millions, dtype: bool

In [183]:
g7_pop[g7_pop > 70]

Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in millions, dtype: float64

In [184]:
g7_pop.mean()

107.30257142857144

In [185]:
g7_pop[g7_pop > g7_pop.mean()]

Japan            127.061
United States    318.523
Name: G7 Population in millions, dtype: float64

In [186]:
g7_pop.std()

97.24996987121581

In [187]:
g7_pop[(g7_pop > g7_pop.mean() - g7_pop.std() / 2) | (g7_pop > g7_pop.mean() + g7_pop.std() / 2)]

France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

# Operations and methods

In [188]:
pd.Series(g7_pop * 1_000_000, dtype=int)

Canada             35467000
France             63951000
Germany            80940000
Italy              60665000
Japan             127061000
United Kingdom     64510999
United States     318523000
Name: G7 Population in millions, dtype: int64

In [189]:
g7_pop.mean()

107.30257142857144

In [190]:
g7_pop['France' : 'Italy'].mean()

68.51866666666666

# Boolean arrays

In [191]:
g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

In [192]:
g7_pop > 80

Canada            False
France            False
Germany            True
Italy             False
Japan              True
United Kingdom    False
United States      True
Name: G7 Population in millions, dtype: bool

In [193]:
g7_pop[g7_pop > 80]

Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in millions, dtype: float64

In [194]:
g7_pop[(g7_pop > 80) | (g7_pop < 40)] 

Canada            35.467
Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in millions, dtype: float64

In [195]:
g7_pop[(g7_pop > 80) & (g7_pop < 200)] 

Germany     80.940
Japan      127.061
Name: G7 Population in millions, dtype: float64

# Modifying series

In [196]:
# Assigning through a label overwrites that element in place; every later cell
# sees the modified g7_pop, not the original figures.
g7_pop['Canada'] = 40.5

In [197]:
g7_pop

Canada             40.500
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in millions, dtype: float64

In [198]:
g7_pop.iloc[-1] = 500

In [199]:
g7_pop  

Canada             40.500
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     500.000
Name: G7 Population in millions, dtype: float64

In [200]:
# Boolean-mask assignment: every element currently below 70 is overwritten in
# place with 99.99; the remaining elements are left untouched.
g7_pop[g7_pop < 70] = 99.99

In [201]:
g7_pop

Canada             99.990
France             99.990
Germany            80.940
Italy              99.990
Japan             127.061
United Kingdom     99.990
United States     500.000
Name: G7 Population in millions, dtype: float64