# Source: [Data Analysis with Python](https://www.freecodecamp.org/learn/data-analysis-with-python/)

# Importing Libraries

In [1]:
import pandas as pd
import numpy as np

# Pandas Series (Concept)

In [2]:
# Every element of a Series is paired with an index label (0..n-1 by default).

# Populations of the Group of Seven (G7), in millions.
g7_pop = pd.Series([
    35.467,   # Canada
    63.951,   # France
    80.940,   # Germany
    60.665,   # Italy
    127.061,  # Japan
    64.511,   # United Kingdom
    318.523,  # United States
])
g7_pop

0     35.467
1     63.951
2     80.940
3     60.665
4    127.061
5     64.511
6    318.523
dtype: float64

In [3]:
# A Series can be given a name, which documents what its values represent

g7_pop.name = 'G7 Population in Millions'

In [4]:
# Display again: the footer now carries the name assigned to the Series
g7_pop

0     35.467
1     63.951
2     80.940
3     60.665
4    127.061
5     64.511
6    318.523
Name: G7 Population in Millions, dtype: float64

In [5]:
# Data type shared by all stored elements
g7_pop.dtype

dtype('float64')

In [6]:
# The underlying data on its own, without the index labels
g7_pop.values

array([ 35.467,  63.951,  80.94 ,  60.665, 127.061,  64.511, 318.523])

In [7]:
# The values are held in a NumPy array
type(g7_pop.values)

numpy.ndarray

In [8]:
# Indexing works with Series: with the default integer index, g7_pop[0] looks up the label 0

print(g7_pop)
print("first element: ",g7_pop[0])
print("second element: ", g7_pop[1])

0     35.467
1     63.951
2     80.940
3     60.665
4    127.061
5     64.511
6    318.523
Name: G7 Population in Millions, dtype: float64
first element:  35.467
second element:  63.951


In [9]:
# The index of a Series can be replaced: swap the default integer labels
# for country names, listed in the same order as the values.
g7_pop.index = ['Canada', 'France', 'Germany', 'Italy',
                'Japan', 'United Kingdom', 'United States']

g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

# Creating a Series from Scratch

In [10]:
# Build the Series directly from a dict: keys become the index labels, values the data
pd.Series({
    'Canada': 35.467,
    'France': 63.951,
    'Germany': 80.94,
    'Italy': 60.665,
    'Japan': 127.061,
    'United Kingdom': 64.511,
    'United States': 318.523
}, name= 'G7 Population in Millions')

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

In [11]:
# Same Series built from two parallel lists: the values, then their index labels.
# Labels are spelled exactly as in the other cells ('United Kingdom', capital U),
# so a label lookup behaves the same on every variant of the Series.
g7_pop_from_lists = pd.Series(
    [35.467, 63.951, 80.94, 60.665, 127.061, 64.511, 318.523],
    index=['Canada', 'France', 'Germany', 'Italy', 'Japan', 'United Kingdom', 'United States'],
    name='G7 Population in Millions',
)
g7_pop_from_lists

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
united Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

In [12]:
# A Series can also be built from another Series by listing the index labels to keep;
# labels that are missing from the source (here 'Spain') are filled with NaN

pd.Series(g7_pop, index=['France', 'Germany', 'Italy', 'Spain'])

France     63.951
Germany    80.940
Italy      60.665
Spain         NaN
Name: G7 Population in Millions, dtype: float64

# Indexing

In [13]:
# Look up a single element by its index label
g7_pop['Canada']

35.467

In [14]:
# Any label of the index can be used the same way
g7_pop['Japan']

127.061

In [15]:
# .iloc selects by position instead of label: position 0 is the first element
g7_pop.iloc[0]

35.467

In [16]:
# Negative positions count from the end: -1 is the last element
g7_pop.iloc[-1]

318.523

In [17]:
g7_pop[['Italy','France']] # a list of labels returns a new Series, in the order requested

Italy     60.665
France    63.951
Name: G7 Population in Millions, dtype: float64

In [18]:
# A list of positions works with .iloc in the same way
g7_pop.iloc[[0,1,2]]

Canada     35.467
France     63.951
Germany    80.940
Name: G7 Population in Millions, dtype: float64

In [19]:
# Series also support slicing by label; unlike Python's positional slices,
# the end label ('Italy') is INCLUDED in the result.

g7_pop['Canada':'Italy']

Canada     35.467
France     63.951
Germany    80.940
Italy      60.665
Name: G7 Population in Millions, dtype: float64

# Conditional Selection (Boolean Arrays)

In [20]:
# The full Series, for reference before filtering it
g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

In [21]:
# A comparison is applied element by element and yields a boolean Series
g7_pop>70

Canada            False
France            False
Germany            True
Italy             False
Japan              True
United Kingdom    False
United States      True
Name: G7 Population in Millions, dtype: bool

In [22]:
# Indexing with that boolean Series keeps only the elements marked True
g7_pop[g7_pop>70]

Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in Millions, dtype: float64

In [23]:
# Average population of the seven countries (in millions)
g7_pop.mean()

107.30257142857144

In [24]:
# The threshold can be computed from the data itself: countries above the mean
g7_pop[ g7_pop>g7_pop.mean()]

Japan            127.061
United States    318.523
Name: G7 Population in Millions, dtype: float64

In [25]:
# Standard deviation: how widely the populations are spread around the mean
g7_pop.std()

97.24996987121581

In [26]:
# Two masks combined with | (element-wise OR).
# NOTE(review): both clauses use `>`, so the second one (above mean + std) is already
# implied by the first (above mean - std) and the `|` adds nothing. With mean ~107.3
# and std ~97.2 every country lies above mean - std, so this filter keeps all seven
# rows. If the goal was to pick out outliers, the first clause probably wants `<` --
# confirm the intent before changing it.
g7_pop[(g7_pop > g7_pop.mean() - g7_pop.std()) | (g7_pop > g7_pop.mean()  + g7_pop.std())]

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

# Operations & Methods

In [27]:
# Arithmetic with a scalar is applied to every element; index and name are kept
g7_pop + 100

Canada            135.467
France            163.951
Germany           180.940
Italy             160.665
Japan             227.061
United Kingdom    164.511
United States     418.523
Name: G7 Population in Millions, dtype: float64

In [28]:
# Aggregation methods such as mean() reduce the Series to a single number
g7_pop.mean()

107.30257142857144

In [29]:
# NumPy functions can be applied to a Series: the result is again a Series with the same index
np.log(g7_pop)

Canada            3.568603
France            4.158117
Germany           4.393708
Italy             4.105367
Japan             4.844667
United Kingdom    4.166836
United States     5.763695
Name: G7 Population in Millions, dtype: float64

In [30]:
# Methods chain onto a selection: mean of the France..Italy label slice (three countries)
g7_pop['France': 'Italy'].mean()

68.51866666666666

# Boolean Arrays

In [31]:
# The Series the boolean masks below are computed from
g7_pop

Canada             35.467
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

In [32]:
# Boolean mask: True where the population exceeds 80 million
g7_pop > 80


Canada            False
France            False
Germany            True
Italy             False
Japan              True
United Kingdom    False
United States      True
Name: G7 Population in Millions, dtype: bool

In [33]:
# Use the mask as a selector: only the elements marked True are returned
g7_pop[g7_pop>80]

Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in Millions, dtype: float64

In [34]:
# | is the element-wise OR of two masks; each comparison needs its own parentheses
g7_pop[(g7_pop>80) | (g7_pop<40)]

Canada            35.467
Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in Millions, dtype: float64

In [35]:
# & is the element-wise AND: both conditions must hold for an element to be kept
g7_pop[(g7_pop>80) & (g7_pop<400)]

Germany           80.940
Japan            127.061
United States    318.523
Name: G7 Population in Millions, dtype: float64

# Modifying Series

In [36]:
# Assigning through a label overwrites that element of g7_pop in place
g7_pop['Canada'] = 40.5

In [37]:
# Canada now reads 40.5
g7_pop

Canada             40.500
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     318.523
Name: G7 Population in Millions, dtype: float64

In [38]:
# Assignment by position works through .iloc; -1 targets the last element
g7_pop.iloc[-1]= 500

In [39]:
# The last entry (United States) is now 500
g7_pop

Canada             40.500
France             63.951
Germany            80.940
Italy              60.665
Japan             127.061
United Kingdom     64.511
United States     500.000
Name: G7 Population in Millions, dtype: float64

In [40]:

# A boolean mask on the left-hand side updates every matching element at once
g7_pop[g7_pop<70]=99.99

In [41]:
# Every value that was below 70 has been replaced by 99.99
g7_pop

Canada             99.990
France             99.990
Germany            80.940
Italy              99.990
Japan             127.061
United Kingdom     99.990
United States     500.000
Name: G7 Population in Millions, dtype: float64