<a href="https://colab.research.google.com/github/WizardOfCodes442/Numpy-docs/blob/main/numpy_universal_func.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

In [17]:
#Computation on Numpy Arrays: Universal functions


#The slowness of loop
#for example, we have an array of valuoes and we'd like to
#compute the reciprocal of each
#A straightforward approach might look like this

%matplotlib inline
import matplotlib.pyplot as plt
import numpy as np
from scipy import special
import pandas as pd
np.random.seed(0)

def compute_reciprocals(values):
  output = np.empty(len(values))
  for i in range(len(values)):
    output[i] = 1.0 / values[i]
  return output
values = np.random.randint(1, 10, size=5)
compute_reciprocals(values)

#if we measure the excution time of this code for
#large input, we see that the operation is very slow
#we'll benchmark this with Ipython's %timeit magic

big_array = np.random.randint(1, 100, size=1000000)
%timeit compute_reciprocals(big_array)

#for many types of operations, Numpy provides  a
#convenient interface into just this kind of statically
#typed, compiled routine. This is known as vectorized operation.
#you can accomplish this by simply performing an operation on the array
#which will then be applied to each element

#This vectorized approach is designed to push the loop into
#the compiled layer that underlies NumPy, leading to much faster
#excution
print(compute_reciprocals(values))
print(1.0/values)

%timeit (1.0/big_array)

#Vectorized operations are implemented via ufuncs, whose main purpose
#is to quickly execute repeated operations on values in Numpy arrays.
#Ufuncs are extremely flexible

#we can operate between two arrays
np.arange(5)/ np.arange(1, 6)

#ufunc operation are not limited to one-dimensional arrays
#they can act on multi-dimensional arrays as wells

x = np.arange(9).reshape((3,3))
2 * x

#computation using vectorization through ufuncs are nearly always more
#effecient than their counterpart implemented through Pyhton loops, especially
#as the arrays groiw in size
#always consider replacing all loops in python scripts with
#vectorized expressions.

#Array arithmetic
x = np.arange(4)
print("x       =",  x)
print("x + 5  = ", x + 5)
print("x - 5 = "  ,x  - 5 )
print("x  *  2 = ",    x *  2 )
print("x / 2 = ", x / 2 )
print("x   //  2 =",  x //2)

#There is also a unary ufunc for negation, a ** operator for exponentiation
#and a % operator for modulus:
print("-x       =", -x )
print("x   ** 2 =",  x ** 2 )
print("x   %   2 ", x % 2)

#In addition, these arithmetic operations can be strung together however you wish,
#and the standard order of operation is respected
-(0.5*x + 1) ** 2

#all operations are simply convenient wrappers arround specific functions
#built into Numpy, for example, the _+ operator is a wrapper for add function

x = np.array([-2, -1, 0, 1, 2])
abs(x)
np.absolute(x)
np.abs(x)

#The ufunc function can also handle complex data, in which the absolute value
#returns the magnitude:

x = np.array([3 - 4j, 4 -3j, 2+ 0j, 0 + 1j])
np.abs(x)

#Trigonometric functions
#start by defining an arrays of angles:

theta = np.linspace(0, np.pi, 3)

#now we can compute some trigonometric functions on these values:
print("theta       =",  theta)
print("sin(theta)   = ", np.sin(theta))
print("cos(theta)  =  ", np.cos(theta))
print("tan(theta)    =   ",  np.tan(theta))

#Exponents and logarithms
x = [1, 2, 3]
print("x    = ", x)
print("e^x    =", np.exp(x))
print("2^x  =  ", np.exp2(x))
print("3^x    =   ", np.power(3, x))

#The inverse of the exponentials, the logarithms, are also available.
#The basic np.log gives the natuaral logarithm,
#base-2 and base-10 logarithms are available as well.

x = [1, 2,4, 10]
print("x     =",  x)
print("ln(x)         =", np.log(x))
print("log2(x)      ", np.log2(x))
print("log10(x)    =",  np.log10(x))

#some specialized versions that are useful for maintaining precision with
#with very small input:
x = [0, 0.001, 0.01, 0.1]
print("exp(x)  -1 =", np.expm1(x))
print("log(1+ x)= " , np.log1p(x))

#Specialized ufuncs
#Numpy has many more ufuncs available, including hyperbolic trig functions,
#bitwise arithmetic, comparison operators, conversions from radians to degree,
#rounding and remainders, and so much more.
#obscure methematical functions on your data, scipy.special

#gamma functions (generalized factorials ) and related functions
x = [1, 5, 10]
print("gamma(x)     =", special.gamma(x))
print("ln| gamma(x) |   ="  , special.gammaln(x))
print("beta(x, 2)  = ", special.beta(x,  2))

#Error function (integral of Gaussian)
#its complement, and its inverse
x = np.array([0, 0.3, 0.7, 1.0])
print("erf(x)    =", special.erf(x))
print("erfc(x)    =", special.erfc(x))
print("erfinv(x)  = ", special.erfcinv(x))

#Advanced Ufunc functions

#Specifying output
x = np.arange(5)
y = np.empty(5)
np.multiply(x, 10, out=y)

#This can be used with array view. we can write the result of a computation
#to every other element of a specified array :
y = np.zeros(10)
np.power(2, x, out=y[::2])
print(y)

#Aggregates
x = np.arange(1, 6)
np.add.reduce(x)

#similarly , calling reduce on the multiply ufunc results in the product
#of all the array elements
np.multiply.reduce(x)

#If we'd like to store all the intermediate result in a computation
#we can instead use accumulate
np.add.accumulate(x)
np.multiply.accumulate(x)

#outer Products
#ufuncs can compute the output of all pairs of two diffrent inputs using
#the outer method.
#This allows you, ..

x = np.arange(1, 6)
np.multiply.outer(x, x)

#Aggregations: Min, Max and eerything between
#summing value in an array
L = np.random.random(100)
sum(L)
np.sum(L)

big_array = np.random.rand(1000000)
%timeit sum(big_array)
%timeit np.sum(big_array)

#similarly
min(big_array)
max(big_array)
np.min(big_array)
np.max(big_array)

#Multidimensional aggregates
M = np.random.random((3, 4))
print(M)
M.sum()
M.min(axis = 0)
M.max(axis = 1)

#Example what's the average height of the US president
data = pd.read_csv('data/president_heights.csv')
heights = np.array(data['height(cm)'])
print(heights)

print("Mean height:       ", heights.mean())
print("Standard deviation:", heights.std())
print("Minimum height:    ", heights.min())
print("Maximum height:    ", heights.max())
print("25th percentile:   ", np.percentile(heights, 25))
print("Median:            ", np.median(heights))
print("75th percentile:   ", np.percentile(heights, 75))

plt.hist(heights)
plt.title('heights Distribution of Us Presidents ')
plt.xlabel('height (cm)')
plt.ylabel('number')
plt.show()

2.08 s ± 509 ms per loop (mean ± std. dev. of 7 runs, 1 loop each)
[0.16666667 1.         0.25       0.25       0.125     ]
[0.16666667 1.         0.25       0.25       0.125     ]
2.1 ms ± 305 µs per loop (mean ± std. dev. of 7 runs, 1000 loops each)
x       = [0 1 2 3]
x + 5  =  [5 6 7 8]
x - 5 =  [-5 -4 -3 -2]
x  *  2 =  [0 2 4 6]
x / 2 =  [0.  0.5 1.  1.5]
x   //  2 = [0 0 1 1]
-x       = [ 0 -1 -2 -3]
x   ** 2 = [0 1 4 9]
x   %   2  [0 1 0 1]
theta       = [0.         1.57079633 3.14159265]
sin(theta)   =  [0.0000000e+00 1.0000000e+00 1.2246468e-16]
cos(theta)  =   [ 1.000000e+00  6.123234e-17 -1.000000e+00]
tan(theta)    =    [ 0.00000000e+00  1.63312394e+16 -1.22464680e-16]
x    =  [1, 2, 3]
e^x    = [ 2.71828183  7.3890561  20.08553692]
2^x  =   [2. 4. 8.]
3^x    =    [ 3  9 27]
x     = [1, 2, 4, 10]
ln(x)         = [0.         0.69314718 1.38629436 2.30258509]
log2(x)       [0.         1.         2.         3.32192809]
log10(x)    = [0.         0.30103    0.60205999 1.        

FileNotFoundError: [Errno 2] No such file or directory: 'data/president_heights.csv'