### NUMPY STATISTICS
- Compute the median of a NumPy array (`np.median` works on the flattened array by default)

In [1]:
import numpy as np

In [2]:
# Seven integers in ascending order, so the median is the middle (4th) value.
arr = np.array([3, 4, 5, 8, 11, 22, 34])

# The result comes back as a float even though the input holds integers.
med = np.median(arr)

message = 'The median of %s is %s' % (arr, med)
print(message)

The median of [ 3  4  5  8 11 22 34] is 8.0


- Find the mean of each NumPy array in a list

In [3]:
# Three integer arrays of equal length; each one is averaged independently.
arr1 = np.array([3, 4, 6, 9])
arr2 = np.array([1, 2, 4, 5])
arr3 = np.array([5, 7, 8, 10])

list_ = [arr1, arr2, arr3]

# Convert every NumPy scalar to a built-in float: printing a list shows the
# repr of its elements, and NumPy >= 2.0 renders that as `np.float64(5.5)`
# instead of the plain `5.5` expected here.
means = [float(np.mean(a)) for a in list_]

print('List of arrays: %s'%list_)
print('Respective mean values: %s'%means)

List of arrays: [array([3, 4, 6, 9]), array([1, 2, 4, 5]), array([ 5,  7,  8, 10])]
Respective mean values: [5.5, 3.0, 7.5]


- Calculate the mean of an array, ignoring NaN values

In [4]:
# Five numbers plus one NaN placeholder in the fourth position.
arr = np.array([1, 3, 4, np.nan, 2, 4])

# nanmean skips the NaN entry and averages the remaining five values.
mean = np.nanmean(arr)

print(
    'Array with nan in it: %s' % arr,
    'Mean of the array: %s' % mean,
    sep='\n',
)

Array with nan in it: [ 1.  3.  4. nan  2.  4.]
Mean of the array: 2.8


- Get the mean value of a given matrix

In [5]:
# 3x3 integer matrix.
arr = np.array([
    [1, 2, 3],
    [5, 6, 8],
    [9, 10, 22],
])

# No axis is given, so all nine entries are averaged into a single number.
mean = arr.mean()

summary = 'The mean of the matrix:\n%s\n\nis %s' % (arr, mean)
print(summary)

The mean of the matrix:
[[ 1  2  3]
 [ 5  6  8]
 [ 9 10 22]]

is 7.333333333333333


- Compute the variance of the NumPy array

In [6]:
arr = np.array([3, 5, 7, 9, 11, 13, 17])

# Default settings: population variance (sum of squared deviations divided by N).
variance = arr.var()

message = 'The variance of %s is %s' % (arr, variance)
print(message)

The variance of [ 3  5  7  9 11 13 17] is 19.918367346938773


- Compute the standard deviation of the NumPy array

In [7]:
arr = np.array([1, 3, 11, 14, 21, 32, 51])

# Standard deviation over all seven values, using NumPy's default settings.
std = arr.std()

message = 'The standard deviation of %s is %s' % (arr, std)
print(message)

The standard deviation of [ 1  3 11 14 21 32 51] is 16.327015298927986


- Compute Pearson product-moment correlation coefficients of two given NumPy arrays

In [8]:
# Two samples of equal length to correlate with each other.
arr1 = np.array([3, 5, 7, 9, 11, 13, 17])
arr2 = np.array([1, 3, 11, 14, 21, 32, 51])

# The result is a 2x2 matrix: ones on the diagonal, and the off-diagonal
# entries hold the correlation between arr1 and arr2.
corr_coef = np.corrcoef(arr1, arr2)

print(
    'A =%s\n\nB =%s\n' % (arr1, arr2),
    'Correlation coefficients of A and B:\n%s' % corr_coef,
    sep='\n',
)

A =[ 3  5  7  9 11 13 17]

B =[ 1  3 11 14 21 32 51]

Correlation coefficients of A and B:
[[1.         0.98025326]
 [0.98025326 1.        ]]


- Calculate the mean along each dimension of a 2D NumPy array

In [9]:
# 4 rows x 3 columns.
arr = np.array([
    [3, 5, 7],
    [9, 8, 4],
    [2, 6, 9],
    [0, 0, 4],
])

# axis=1 averages within each row (4 results);
# axis=0 averages within each column (3 results).
row_means = arr.mean(axis=1)
col_means = arr.mean(axis=0)

print(
    'Array:\n%s\n' % arr,
    'Row means: %s\n' % row_means,
    'Column means: %s\n' % col_means,
    sep='\n',
)

Array:
[[3 5 7]
 [9 8 4]
 [2 6 9]
 [0 0 4]]

Row means: [5.         7.         5.66666667 1.33333333]

Column means: [3.5  4.75 6.  ]



- Calculate the average, variance and standard deviation in Python using NumPy

In [10]:
arr = np.array([1, 3, 11, 14, 21, 32, 51])

# Unweighted average, population variance, and the matching standard
# deviation (the square root of that variance).
avg, variance, std = np.average(arr), np.var(arr), np.std(arr)

print(
    'The array %s has\n ° average = %s\n ° variance = %s\n ° standard deviation = %s'
    % (arr, avg, variance, std)
)

The array [ 1  3 11 14 21 32 51] has
 ° average = 19.0
 ° variance = 266.57142857142856
 ° standard deviation = 16.327015298927986


- Describe a NumPy Array in Python

In [11]:
def describe(arr):
    """Print a summary of descriptive statistics for ``arr``.

    The report lists, one per line: shape, mean, median, standard deviation,
    average, variance, minimum, the 25th/50th/75th percentiles, maximum and
    range (maximum minus minimum). Every statistic is taken over all elements
    of the input.

    Parameters
    ----------
    arr : array_like
        Numeric data. Anything ``np.asarray`` accepts (ndarray, list,
        tuple, ...) is supported.

    Raises
    ------
    ValueError
        If ``arr`` contains no elements.
    """
    data = np.asarray(arr)
    if data.size == 0:
        # min/max cannot reduce a zero-size array; fail up front with a clear
        # message instead of part-way through the statistics.
        raise ValueError('describe() requires a non-empty array')

    # A single percentile call yields all three quartiles at once.
    q25, q50, q75 = np.percentile(data, [25, 50, 75])

    stats = [
        ('shape', data.shape),
        ('mean', np.mean(data)),
        ('median', np.median(data)),
        ('standard deviation', np.std(data)),
        ('average', np.average(data)),
        ('variance', np.var(data)),
        ('min', np.min(data)),
        ('25%', q25),
        ('50%', q50),
        ('75%', q75),
        ('max', np.max(data)),
        ('range', np.ptp(data)),
    ]

    print('Description of the array: %s' % (data,))
    for key, val in stats:
        print(' ° %s = %s' % (key, val))


arr = np.array([3, 5, 7, 9, 11, 13, 17])
describe(arr)

Description of the array: [ 3  5  7  9 11 13 17]
 ° shape = (7,)
 ° mean = 9.285714285714286
 ° median = 9.0
 ° standard deviation = 4.462999814803802
 ° average = 9.285714285714286
 ° variance = 19.918367346938773
 ° min = 3
 ° 25% = 6.0
 ° 50% = 9.0
 ° 75% = 12.0
 ° max = 17
 ° range = 14
