### Pandas - Aggregate

In [1]:
import pandas as pd
import numpy as np

In [3]:
array = np.random.randint(10,30,size = (5,4))
df = pd.DataFrame(array, columns = list("ABCD"))
df

Unnamed: 0,A,B,C,D
0,26,26,16,15
1,25,17,17,10
2,28,24,24,24
3,14,19,18,28
4,10,10,29,25


In [4]:
df.describe()

Unnamed: 0,A,B,C,D
count,5.0,5.0,5.0,5.0
mean,20.6,19.2,20.8,20.4
std,8.049845,6.300794,5.540758,7.569676
min,10.0,10.0,16.0,10.0
25%,14.0,17.0,17.0,15.0
50%,25.0,19.0,18.0,24.0
75%,26.0,24.0,24.0,25.0
max,28.0,26.0,29.0,28.0


In [5]:
df["A"].mean()

20.6

In [7]:
df["A"].var()

64.8

In [8]:
df["A"].std()

8.049844718999243

In [10]:
df.aggregate(np.mean)

A    20.6
B    19.2
C    20.8
D    20.4
dtype: float64

In [12]:
df.mean()

A    20.6
B    19.2
C    20.8
D    20.4
dtype: float64

In [14]:
df.agg(np.mean)

A    20.6
B    19.2
C    20.8
D    20.4
dtype: float64

In [17]:
df.apply(np.mean)

A    20.6
B    19.2
C    20.8
D    20.4
dtype: float64

In [19]:
df.aggregate(np.max)

A    28
B    26
C    29
D    28
dtype: int32

In [21]:
df.aggregate([np.max])

Unnamed: 0,A,B,C,D
amax,28,26,29,28


In [23]:
df.aggregate([np.mean])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4


In [25]:
df.aggregate([np.mean, np.min])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4
amin,10.0,10.0,16.0,10.0


In [27]:
df.aggregate([np.mean, np.min, np.std])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4
amin,10.0,10.0,16.0,10.0
std,8.049845,6.300794,5.540758,7.569676


In [29]:
df.aggregate([np.mean, np.min, np.std, np.var])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4
amin,10.0,10.0,16.0,10.0
std,8.049845,6.300794,5.540758,7.569676
var,64.8,39.7,30.7,57.3


In [31]:
df.aggregate([np.mean, np.min, np.std, np.var, min, max])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4
amin,10.0,10.0,16.0,10.0
std,8.049845,6.300794,5.540758,7.569676
var,64.8,39.7,30.7,57.3
min,10.0,10.0,16.0,10.0
max,28.0,26.0,29.0,28.0


In [33]:
df.aggregate([np.mean, np.min, np.std, np.var, min, max, sum])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4
amin,10.0,10.0,16.0,10.0
std,8.049845,6.300794,5.540758,7.569676
var,64.8,39.7,30.7,57.3
min,10.0,10.0,16.0,10.0
max,28.0,26.0,29.0,28.0
sum,103.0,96.0,104.0,102.0


In [34]:
df.aggregate([np.mean, np.min, np.std, np.var, min, max, sum])

Unnamed: 0,A,B,C,D
mean,20.6,19.2,20.8,20.4
amin,10.0,10.0,16.0,10.0
std,8.049845,6.300794,5.540758,7.569676
var,64.8,39.7,30.7,57.3
min,10.0,10.0,16.0,10.0
max,28.0,26.0,29.0,28.0
sum,103.0,96.0,104.0,102.0


In [36]:
df.aggregate([min, max, sum])

Unnamed: 0,A,B,C,D
min,10,10,16,10
max,28,26,29,28
sum,103,96,104,102


In [42]:
df.aggregate([min, max, sum, 'std','var', 'median'])

Unnamed: 0,A,B,C,D
min,10.0,10.0,16.0,10.0
max,28.0,26.0,29.0,28.0
sum,103.0,96.0,104.0,102.0
std,8.049845,6.300794,5.540758,7.569676
var,64.8,39.7,30.7,57.3
median,25.0,19.0,18.0,24.0


In [43]:
df.aggregate(['min', 'max', 'sum', 'std','var', 'median'])

Unnamed: 0,A,B,C,D
min,10.0,10.0,16.0,10.0
max,28.0,26.0,29.0,28.0
sum,103.0,96.0,104.0,102.0
std,8.049845,6.300794,5.540758,7.569676
var,64.8,39.7,30.7,57.3
median,25.0,19.0,18.0,24.0


In [45]:
df['B'].aggregate(['min', 'max', 'sum', 'std','var', 'median'])

min       10.000000
max       26.000000
sum       96.000000
std        6.300794
var       39.700000
median    19.000000
Name: B, dtype: float64

In [46]:
df[['B','D']].aggregate(['min', 'max', 'sum', 'std','var', 'median'])

Unnamed: 0,B,D
min,10.0,10.0
max,26.0,28.0
sum,96.0,102.0
std,6.300794,7.569676
var,39.7,57.3
median,19.0,24.0


In [48]:
df

Unnamed: 0,A,B,C,D
0,26,26,16,15
1,25,17,17,10
2,28,24,24,24
3,14,19,18,28
4,10,10,29,25


In [50]:
df.iloc[1,2] = 'python'
df

Unnamed: 0,A,B,C,D
0,26,26,16,15
1,25,17,python,10
2,28,24,24,24
3,14,19,18,28
4,10,10,29,25


In [52]:
df.aggregate(['min', 'max', 'sum', 'std','var', 'median'])

  df.aggregate(['min', 'max', 'sum', 'std','var', 'median'])


Unnamed: 0,A,B,D
min,10.0,10.0,10.0
max,28.0,26.0,28.0
sum,103.0,96.0,102.0
std,8.049845,6.300794,7.569676
var,64.8,39.7,57.3
median,25.0,19.0,24.0


In [55]:
df.select_dtypes(include=[int,float]).aggregate(['min', 'max', 'sum', 'std','var', 'median'])

Unnamed: 0,A,B,D
min,10.0,10.0,10.0
max,28.0,26.0,28.0
sum,103.0,96.0,102.0
std,8.049845,6.300794,7.569676
var,64.8,39.7,57.3
median,25.0,19.0,24.0
