<p style="font-family: Arial; font-size:3.75em;color:purple; font-style:bold"><br>
Introduction to numpy:
</p><br>

<p style="font-family: Arial; font-size:1.25em;color:#2462C0; font-style:bold"><br>
Package for scientific computing with Python
</p><br><br>

<p style="font-family: Arial; font-size:2.75em;color:purple; font-style:bold"><br>

ndarray<br><br></p>

<p style="font-family: Arial; font-size:1.25em;color:#2462C0; font-style:bold"><br>
Time and space-efficient multidimensional arrays:

</p>

In [2]:
import numpy as np

# Build a one-dimensional (rank 1) array from a plain Python list
an_array = np.array([3, 33, 333])

print(type(an_array))   # the container type is numpy.ndarray
print(an_array.shape)   # a rank 1 array has a one-element shape tuple

# Unpack the three elements straight into print()
print(*an_array)

# ndarrays are mutable: overwrite the first element in place
an_array[0] = 888
print(an_array)

<class 'numpy.ndarray'>
(3,)
3 33 333
[888  33 333]


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

How to create a Rank 2 numpy array:</p>

In [47]:
# A nested list produces a rank 2 array: one inner list per row
another = np.array([
    [11, 12, 13],
    [21, 22, 23],
])

print(another.shape)  # (rows, columns)

# First two entries of row 0, followed by the first entry of row 1
print(*another[0, :2], another[1, 0])

(2, 3)
11 12 21


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

There are many ways to create numpy arrays:
</p>

In [91]:
import numpy as np

# Each result is printed followed by one blank line to separate the examples.

# Every element set to zero
ex1 = np.zeros((2, 2))
print(ex1, end="\n\n")

# Every element set to the same fill value (9.0)
ex2 = np.full((2, 2), 9.0)
print(ex2, end="\n\n")

# 2x2 identity matrix: ones on the diagonal, zeros elsewhere
ex3 = np.eye(2)
print(ex3, end="\n\n")

# Every element set to one (a single row of two columns)
ex4 = np.ones((1, 2))
print(ex4, end="\n\n")

# Random floats; the values differ on every run
ex5 = np.random.random((2, 2))
print(ex5)

[[ 0.  0.]
 [ 0.  0.]]

[[ 9.  9.]
 [ 9.  9.]]

[[ 1.  0.]
 [ 0.  1.]]

[[ 1.  1.]]

[[ 0.85755874  0.59682324]
 [ 0.12201789  0.08788861]]


<p style="font-family: Arial; font-size:2.75em;color:purple; font-style:bold"><br>

Array Indexing
<br><br></p>

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Slice indexing:
</p>

In [89]:
import numpy as np

# 3 x 4 matrix (rank 2)
an_array = np.array([
    [11, 12, 13, 14],
    [21, 22, 23, 24],
    [31, 32, 33, 34],
])
print(an_array, end="\n\n")

# Basic slicing: rows 0-1 crossed with columns 1-2 gives a 2 x 2 sub-array
a_slice = an_array[0:2, 1:3]
print(a_slice, end="\n\n")

# The slice shares its data with an_array, so writing through the slice
# is visible in the parent: a_slice[0, 0] and an_array[0, 1] are the same cell.
print(an_array[0, 1])
a_slice[0, 0] = 1000
print(an_array[0, 1])

[[11 12 13 14]
 [21 22 23 24]
 [31 32 33 34]]

[[12 13]
 [22 23]]

12
1000


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Use both integer indexing & slice indexing
</p>

In [88]:
import numpy as np

# 3 x 4 matrix (rank 2)
an_array = np.array([
    [11, 12, 13, 14],
    [21, 22, 23, 24],
    [31, 32, 33, 34],
])
print(an_array, end="\n\n")

# An integer index removes that axis: row 1 comes back as a rank 1 view
row_rank1 = an_array[1, :]

# A length-one slice keeps the axis: row 1 comes back as a rank 2 view
row_rank2 = an_array[1:2, :]

print(row_rank1, row_rank1.shape, end="\n\n")
print(row_rank2, row_rank2.shape)   # note the double brackets [[ ]]

[[11 12 13 14]
 [21 22 23 24]
 [31 32 33 34]]

[21 22 23 24] (4,)

[[21 22 23 24]] (1, 4)


In [87]:
# The same distinction applies when selecting a column instead of a row.

print()
col_rank1 = an_array[:, 1]     # integer index -> rank 1 result
col_rank2 = an_array[:, 1:2]   # length-one slice -> rank 2 result (a single column)

print(col_rank1, col_rank1.shape, end="\n\n")
print(col_rank2, col_rank2.shape)


[12 22 32] (3,)

[[12]
 [22]
 [32]] (3, 1)


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Array Indexing for changing elements:
</p>

In [17]:
# Start from a fresh 4 x 3 array
an_array = np.array([
    [11, 12, 13],
    [21, 22, 23],
    [31, 32, 33],
    [41, 42, 43],
])
print('Original Array:', an_array, sep='\n')

# Column to pick in each row, and the matching row numbers 0..3
indices = np.array([0, 1, 2, 0])
whichRows = np.arange(4)
print('\nRows indices picked : %s' % whichRows)

# Pairing the two index arrays selects one element per row:
# positions (0, 0), (1, 1), (2, 2) and (3, 0)
print(an_array[whichRows, indices])

# The same index pair on the left-hand side updates those elements in place
an_array[whichRows, indices] += 100000

print('\nChanged Array:', an_array, sep='\n')

Original Array:
[[11 12 13]
 [21 22 23]
 [31 32 33]
 [41 42 43]]

Rows indices picked : [0 1 2 3]
[11 22 33 41]

Changed Array:
[[100011     12     13]
 [    21 100022     23]
 [    31     32 100033]
 [100041     42     43]]


In [22]:
an_array = np.array([[11,12], [21, 22], [31, 32]])

In [23]:
# Elementwise comparison: the result is a boolean array with one True/False
# per element of an_array, usable as a mask for boolean indexing.
# NOTE(review): the name `filter` shadows Python's built-in filter() from here on.
filter = (an_array > 15)
filter  # bare expression so the notebook displays the mask

array([[False, False],
       [ True,  True],
       [ True,  True]], dtype=bool)

In [24]:
print(an_array[filter])

[21 22 31 32]


In [25]:
#Can be done this way also:

an_array[an_array > 15]

array([21, 22, 31, 32])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Datatypes:
</p>

In [27]:
# No dtype given: NumPy infers one from the values (integers here)
ex1 = np.array([11, 12])
print(ex1.dtype)

# Float literals lead NumPy to infer a floating-point dtype
ex2 = np.array([11.0, 12.0])
print(ex2.dtype)

# The dtype can also be requested explicitly
ex3 = np.array([11, 21], dtype=np.int64)
print(ex3.dtype)

int64
float64
int64


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Array Operations:

</p>

In [10]:
# Integer matrix. The `np.int` alias (which was just the built-in int) was
# deprecated in NumPy 1.20 and removed in 1.24, so the built-in is used directly.
x = np.array([[111, 112], [121, 122]], dtype=int)
y = np.array([[211.1, 212.1], [221.1, 222.1]], dtype=np.float64)

# Adding an integer array to a float array gives a float result; the `+`
# operator and the np.add function compute the same elementwise sum.
print(x + y)
print(np.add(x, y))

[[ 322.1  324.1]
 [ 342.1  344.1]]
[[ 322.1  324.1]
 [ 342.1  344.1]]


In [11]:
print(x - y)
print(np.subtract(x, y))

[[-100.1 -100.1]
 [-100.1 -100.1]]
[[-100.1 -100.1]
 [-100.1 -100.1]]


In [12]:
print(x * y)
print(np.multiply(x, y))

[[ 23432.1  23755.2]
 [ 26753.1  27096.2]]
[[ 23432.1  23755.2]
 [ 26753.1  27096.2]]


In [13]:
print(x / y)
print(np.divide(x, y))

[[ 0.52581715  0.52805281]
 [ 0.54726368  0.54930212]]
[[ 0.52581715  0.52805281]
 [ 0.54726368  0.54930212]]


In [14]:
print(np.sqrt(x))

[[ 10.53565375  10.58300524]
 [ 11.          11.04536102]]


In [15]:
print(np.exp(x))

[[  1.60948707e+48   4.37503945e+48]
 [  3.54513118e+52   9.63666567e+52]]


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Dot Product / Matrix Multiplication:

</p>

In [70]:
# Two 2 x 2 integer matrices
x2d = np.array([[1, 1], [1, 1]])
y2d = np.array([[2, 2], [2, 2]])

# Matrix product, spelled first as a method and then as a function;
# both print the same 2 x 2 result.
print(x2d.dot(y2d), end="\n\n")
print(np.dot(x2d, y2d))

[[4 4]
 [4 4]]

[[4 4]
 [4 4]]


In [69]:
# Two rank 1 vectors of equal length
a1d = np.array([9, 9])
b1d = np.array([10, 10])

# For rank 1 inputs the dot product is a single number (the inner product);
# the method and function spellings agree.
print(a1d.dot(b1d), end="\n\n")
print(np.dot(a1d, b1d))

180

180


In [67]:
print(x2d.dot(a1d))
print()
print(np.dot(x2d, a1d))

[18 18]

[18 18]


<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Sum / Transpose:

</p>

In [73]:
ex1 = np.array([[11, 12], [21, 22]])

# Each result is printed followed by one blank line.
print(np.sum(ex1), end="\n\n")          # total over every element
print(np.sum(ex1, axis=0), end="\n\n")  # sum down the rows -> one value per column
print(np.sum(ex1, axis=1), end="\n\n")  # sum across the columns -> one value per row

66

[32 34]

[23 43]



<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Binary functions:</p>

In [21]:
x = np.random.randn(8)
x

array([-0.67145205, -1.81409443,  0.59756126, -0.46254935, -0.33429261,
       -2.53156261, -0.31325366,  0.36980675])

In [22]:
y = np.random.randn(8)
y

array([-0.0186239 ,  0.16471443,  1.03041402, -1.11559348,  0.08490375,
       -0.86993466, -0.3468221 ,  0.58119532])

In [24]:
# returns element wise maximum between two arrays

np.maximum(x, y)

array([-0.0186239 ,  0.16471443,  1.03041402, -0.46254935,  0.08490375,
       -0.86993466, -0.31325366,  0.58119532])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Reshaping array:
</p>

In [6]:
arr = np.arange(20)
print(arr)

[ 0  1  2  3  4  5  6  7  8  9 10 11 12 13 14 15 16 17 18 19]


In [8]:
arr.reshape(4,5)

array([[ 0,  1,  2,  3,  4],
       [ 5,  6,  7,  8,  9],
       [10, 11, 12, 13, 14],
       [15, 16, 17, 18, 19]])

In [74]:
ex1.T

array([[11, 21],
       [12, 22]])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Indexing using where():</p>

In [29]:
x_1 = np.array([1,2,3,4,5])

y_1 = np.array([11,22,33,44,55])

filter = np.array([True, False, True, False, True])

In [30]:
out = np.where(filter, x_1, y_1)
print(out)

[ 1 22  3 44  5]


In [32]:
mat = np.random.rand(5,5)
mat

array([[ 0.50650363,  0.70000205,  0.28258421,  0.3453008 ,  0.37620082],
       [ 0.61688835,  0.27297373,  0.0810489 ,  0.59313101,  0.00393335],
       [ 0.11567232,  0.8329555 ,  0.74163426,  0.67805647,  0.11842672],
       [ 0.31958085,  0.55013339,  0.29659014,  0.01627146,  0.20713639],
       [ 0.74352591,  0.42933545,  0.80201787,  0.55404236,  0.32366983]])

In [35]:
np.where( mat > 0.5, 1000, -1)

array([[1000, 1000,   -1,   -1,   -1],
       [1000,   -1,   -1, 1000,   -1],
       [  -1, 1000, 1000, 1000,   -1],
       [  -1, 1000,   -1,   -1,   -1],
       [1000,   -1, 1000, 1000,   -1]])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

any or all conditionals:</p>

In [73]:
arr_bools = np.array([ True, False, True, True, False ])

In [74]:
arr_bools.any()

True

In [75]:
arr_bools.all()

False

<p style="font-family: Arial; font-size:2.75em;color:purple; font-style:bold"><br>

Broadcasting:
<br><br>
</p>

In [3]:
# 4 x 3 matrix; each row is ten times larger in scale than the one before
start = np.array([
    [11, 12, 13],
    [210, 220, 230],
    [3100, 3200, 3300],
    [41000, 42000, 43000],
])
print(start, end="\n\n")

# Length-3 vector: one entry per column of `start`
addThis = np.array([1, 0, 1])
print(addThis, end="\n\n")

# Broadcasting applies the length-3 vector to every one of the four rows
y = start + addThis
print(y)

[[   11    12    13]
 [  210   220   230]
 [ 3100  3200  3300]
 [41000 42000 43000]]

[1 0 1]

[[   12    12    14]
 [  211   220   231]
 [ 3101  3200  3301]
 [41001 42000 43001]]


<p style="font-family: Arial; font-size:2.75em;color:purple; font-style:bold"><br>

Statistical Methods:
<br><br>
</p>

In [64]:
arry = 10 * np.random.randn(2,4)
arry

array([[ -5.96655254,  -8.64245691,  33.6189757 ,  -5.64851025],
       [ -5.1726027 ,  -2.05570427,  -2.98207292,  18.45786079]])

In [65]:
arry.mean()

2.7011171143006116

In [66]:
arry.mean(axis = 1)

array([ 3.340364  ,  2.06187023])

In [67]:
arry.mean(axis = 0)

array([ -5.56957762,  -5.34908059,  15.31845139,   6.40467527])

In [68]:
arry.sum()

21.608936914404893

<p style="font-family: Arial; font-size:2.75em;color:purple; font-style:bold"><br>

Sorting:
<br><br>
</p>

In [81]:
unsorted = np.random.randn(10)
unsorted

array([ 1.27490797,  0.51640029,  1.09288062, -0.53483185, -1.5827483 ,
        0.94011922, -2.54468739, -0.22917393,  0.40715973,  0.1622559 ])

In [86]:
unsorted.sort() #inplace sorting
unsorted

array([-2.54468739, -1.5827483 , -0.53483185, -0.22917393,  0.1622559 ,
        0.40715973,  0.51640029,  0.94011922,  1.09288062,  1.27490797])

In [90]:
# Bonus: np.unique returns the sorted distinct values of the array;
# take .size (or len()) of the result to get how many unique values there are.
np.unique(unsorted)

array([-2.54468739, -1.5827483 , -0.53483185, -0.22917393,  0.1622559 ,
        0.40715973,  0.51640029,  0.94011922,  1.09288062,  1.27490797])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Set Operations with np.array data type:
</p>

In [45]:
s1 = np.array(['desk','chair','bulb'])
s2 = np.array(['lamp','bulb','chair'])

In [46]:
print(s1, s2)

['desk' 'chair' 'bulb'] ['lamp' 'bulb' 'chair']


In [47]:
np.intersect1d(s1, s2)

array(['bulb', 'chair'], 
      dtype='<U5')

In [48]:
np.union1d(s1, s2)

array(['bulb', 'chair', 'desk', 'lamp'], 
      dtype='<U5')

In [49]:
np.setdiff1d(s1, s2) # elements in s1 that are not in s2

array(['desk'], 
      dtype='<U5')

In [51]:
# Membership test: one boolean per element of s1, True where that element
# also occurs in s2. np.isin replaces np.in1d, which is deprecated as of NumPy 2.0.
np.isin(s1, s2)

array([False,  True,  True], dtype=bool)

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Read or Write to Disk:</p>

<p style="font-family: Arial; font-size:1.3em;color:#2462C0; font-style:bold"><br>

Binary Format:</p>

In [65]:
x = np.array([ 23.23, 24.24] )

In [66]:
np.save('an_array', x)

In [67]:
np.load('an_array.npy')

array([ 23.23,  24.24])

<p style="font-family: Arial; font-size:1.3em;color:#2462C0; font-style:bold"><br>

Text Format:</p>

In [70]:
np.savetxt('array.txt', X=x, delimiter=',')

In [71]:
!cat array.txt

2.323000000000000043e+01
2.423999999999999844e+01


In [72]:
np.loadtxt('array.txt', delimiter=',')

array([ 23.23,  24.24])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Random Number Generation:
</p>

In [88]:
# Five samples from the standard normal distribution as a rank 1 array.
# Requesting size=5 directly avoids building a (1, 5) array just to take row 0.
Y = np.random.normal(size=5)
print(Y)

[ 0.02076939  0.96679143  1.19306778  0.44350976 -1.11748734]


In [100]:
Z = np.random.randint(low=2,high=50,size=4)
print(Z)

[26 41 25 23]


In [108]:
np.random.permutation(Z) #return a new ordering of elements in Z

array([41, 25, 23, 26])

In [109]:
np.random.uniform(size=4) #uniform distribution

array([ 0.35821386,  0.82869891,  0.08264538,  0.94053761])

In [110]:
np.random.normal(size=4) #normal distribution

array([-1.51347569, -0.08027449, -1.21703868,  0.62055987])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

Merging data sets:
</p>

In [124]:
# Two independent 2 x 2 matrices of random integers, each value >= 2 and < 50
K = np.random.randint(2, 50, size=(2, 2))
print(K, end="\n\n")

M = np.random.randint(2, 50, size=(2, 2))
print(M)

[[27 11]
 [ 4  5]]

[[ 3 32]
 [21 13]]


In [125]:
np.vstack((K,M))

array([[27, 11],
       [ 4,  5],
       [ 3, 32],
       [21, 13]])

In [126]:
np.hstack((K,M))

array([[27, 11,  3, 32],
       [ 4,  5, 21, 13]])

In [127]:
np.concatenate([K, M], axis = 0)

array([[27, 11],
       [ 4,  5],
       [ 3, 32],
       [21, 13]])

In [128]:
np.concatenate([K, M.T], axis = 1)

array([[27, 11,  3, 21],
       [ 4,  5, 32, 13]])

<p style="font-family: Arial; font-size:1.75em;color:#2462C0; font-style:bold"><br>

numpy documentation: </p>

https://numpy.org/doc/stable/reference/