# NumPy

In [22]:
import numpy as np
import sys

### NumPy is a multidimensional array library.

We use NumPy instead of Python lists because it is much faster, mainly because NumPy arrays use fixed types.

We can choose the data type, e.g. int32, int16, float64.

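A Python `int` stored in a list takes far more space than a NumPy element: every Python integer is a full object that carries its size, a reference count, its object type, and the value itself (about 28 bytes in total on 64-bit CPython), whereas a NumPy `int32` element takes just 4 bytes.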

* When we are iterating over a NumPy array, we don't have to do type checks.

* NumPy is faster to read -> fewer bytes of memory.

* Uses Contiguous Memory

![Screenshot%20%282228%29.png](attachment:Screenshot%20%282228%29.png)
![Screenshot%20%282229%29.png](attachment:Screenshot%20%282229%29.png)
![Screenshot%20%282230%29.png](attachment:Screenshot%20%282230%29.png)
![Screenshot%20%282232%29.png](attachment:Screenshot%20%282232%29.png)

## Basics

In [23]:
# Create a 1-D array from a Python list
a = np.array([1, 2, 3])
print(a)

[1 2 3]


In [24]:
# Create a 2-D array from nested lists, with the element type set explicitly
b = np.array([[1.3, 4.6], [5.5, 9.1]], dtype="float64")
print(b)

[[1.3 4.6]
 [5.5 9.1]]


In [25]:
# Get Dimensions: ndim is the number of axes (1 for the flat array `a`)
a.ndim

1

In [26]:
# `b` was built from a list of lists, so it has two axes
b.ndim

2

In [27]:
# Shape: a tuple holding the length of each axis
print(a.shape)
print(b.shape)

(3,)
(2, 2)


In [28]:
# Memory taken by NumPy Array and Type
print(b.dtype)     # element type
print(b.itemsize)  # bytes per element
print(b.size)      # total number of elements
print(b.nbytes)    # total bytes = size * itemsize

float64
8
4
32


## Accessing / Changing particular elements

In [29]:
# Rebind `a` to a 2 x 5 integer array for the indexing examples
a = np.array([[1, 2, 3, 4, 5], [6, 7, 8, 9, 10]])
print(a)

[[ 1  2  3  4  5]
 [ 6  7  8  9 10]]


In [30]:
# Get a specific element [row, col]
print(a[1,4])
print(a[-1,-1])  # negative indices count from the end, so this is the same element

10
10


In [31]:
# Get a specific row with a[row, :]; a column would be a[:, col]
print(a[1,:])

[ 6  7  8  9 10]


In [32]:
# Slicing: [start_index : end_index : step_size]; end_index is exclusive
print(a[0, 0: 5: 2 ])

[1 3 5]


In [33]:
# Changing a particular element (assignment modifies the array in place)
a[-1,-1] = 20
print(a)

[[ 1  2  3  4  5]
 [ 6  7  8  9 20]]


In [34]:
# Change an entire row: the scalar is broadcast to every element of the slice.
# A whole column would be assigned with a[:, col] = value.
a[0,:] = 5
a[1,:] = 99
print(a)

[[ 5  5  5  5  5]
 [99 99 99 99 99]]


### 3D Example

In [35]:
# Three levels of nesting give a 3-D array (here with shape (1, 2, 2))
d = np.array([[[1, 2],[3, 4]]])
print(d.ndim)

3


In [36]:
# One index per axis; -1 picks the last entry along each axis
print(d[-1,-1,-1])

4


In [37]:
# A 3-D array holding two 2 x 2 blocks; note that this rebinds `b`
b = np.array([[[1,2],[3,4]],[[5,6],[7,8]]])
print(b)

[[[1 2]
  [3 4]]

 [[5 6]
  [7 8]]]


In [38]:
# Get 7: block 1, row 1, column 0
print(b[1, 1, 0])

7


In [39]:
# Replace the whole second block; the length-2 list is broadcast to both of its rows
b[1,:,:] = [99, 88]
print(b)

[[[ 1  2]
  [ 3  4]]

 [[99 88]
  [99 88]]]


## Initialising Different Types of Arrays

In [40]:
# All Zeros Matrix
# np.zeros accepts either a length (1-D result) or a shape tuple (N-D result).
# The 1-D case is printed twice.
# A 4-D shape such as (3, 3, 3, 3) works the same way but prints a very long output.
for zeros_shape in (5, 5, (2, 2)):
    print(np.zeros(zeros_shape), end="\n\n")

[0. 0. 0. 0. 0.]

[0. 0. 0. 0. 0.]

[[0. 0.]
 [0. 0.]]



In [41]:
# All ones matrix with an explicit element type
print(np.ones((3,3), dtype="float64")) # other dtypes work too, e.g. "int32", "int16", "int8"

[[1. 1. 1.]
 [1. 1. 1.]
 [1. 1. 1.]]


In [43]:
# Any other number:
#   np.full_like(a, 4)     -> same shape and dtype as the existing array `a`, filled with 4
#   np.full(a.shape, 99)   -> new array of the given shape, filled with 99
# Here `a` is the 2 x 5 array from the indexing section.
c = np.full_like(a, 4)
print(c)
print("")
d = np.full(a.shape, 99)
print(d)

[[4 4 4 4 4]
 [4 4 4 4 4]]

[[99 99 99 99 99]
 [99 99 99 99 99]]


In [80]:
# Random decimal numbers matrix: uniform samples in [0, 1)
np.random.seed(1)  # fix the seed so the numbers are reproducible
r = np.random.rand(2,2)  # rand takes the dimensions as separate arguments, not as a tuple
print(r)

[[4.17022005e-01 7.20324493e-01]
 [1.14374817e-04 3.02332573e-01]]


In [88]:
# Random integer values
# randint(low, high) draws from the half-open range [low, high).
# When high is None, the first argument is the exclusive upper bound and the range is [0, low).
for low, high in ((4, 9), (300, None), (200, 300)):
    r_i = np.random.randint(low, high, size=(3,3))
    print(r_i)

[[4 7 8]
 [7 8 8]
 [8 5 4]]
[[210  96 269]
 [ 10 279 152]
 [202 148 140]]
[[265 294 260]
 [224 282 297]
 [202 292 298]]


In [90]:
# Identity Matrix: 5 x 5, ones on the main diagonal, stored as 8-bit integers
I = np.identity(5, dtype="int8")
print(I)

[[1 0 0 0 0]
 [0 1 0 0 0]
 [0 0 1 0 0]
 [0 0 0 1 0]
 [0 0 0 0 1]]


In [99]:
arr = np.array([[1,2,3]])
print(arr)
# Repeat
# axis=1 repeats each element along its row; axis=0 repeats the whole row downwards.
r1 = arr.repeat(3, axis=1)
print(r1)
print()
r1 = arr.repeat(3, axis=0)
print(r1)

[[1 2 3]]
[[1 1 1 2 2 2 3 3 3]]

[[1 2 3]
 [1 2 3]
 [1 2 3]]


#### Question
Build this:

[[1   1   1   1   1]

[ 1   0   0   0   1]


[ 1   0   9   0   1]


[ 1   0   0   0   1]


[ 1   1   1   1   1]]

In [104]:
# Step 1: start from a 5 x 5 matrix of ones
a = np.ones((5,5), dtype="int32")
print(a)

[[1 1 1 1 1]
 [1 1 1 1 1]
 [1 1 1 1 1]
 [1 1 1 1 1]
 [1 1 1 1 1]]


In [105]:
# Step 2: zero out the inner 3 x 3 block (rows 1-3, columns 1-3)
a[1:4,1:4] = 0
print(a)

[[1 1 1 1 1]
 [1 0 0 0 1]
 [1 0 0 0 1]
 [1 0 0 0 1]
 [1 1 1 1 1]]


In [106]:
# Step 3: set the centre element to 9
a[2,2] = 9
print(a)

[[1 1 1 1 1]
 [1 0 0 0 1]
 [1 0 9 0 1]
 [1 0 0 0 1]
 [1 1 1 1 1]]


### Copying Arrays ---> Be careful (copy by value vs. copy by reference)

In [109]:
a = np.array([1, 2, 3])
b = a  # plain assignment: `b` is another name for the same array, not a copy
b[0] = 100
print(b)
print(a)
# Both prints show the change because `a` and `b` reference the same array

[100   2   3]
[100   2   3]


In [111]:
# Use .copy() to get an independent array; changing `b` no longer affects `a`
a = np.array([1, 2, 3])
b = a.copy()
b[0] = 100
print("b : ", b)
print("a : ",a)

b :  [100   2   3]
a :  [1 2 3]


## Mathematics

In [131]:
# Base array for the arithmetic examples
a = np.array([[1, 2, 3, 4, 5], [7, 8, 9, 10, 11]])
print(a)

[[ 1  2  3  4  5]
 [ 7  8  9 10 11]]


In [119]:
# Element-wise division; the integer array is promoted to float
print(a/2)

[[0.5 1.  1.5 2.  2.5]
 [3.5 4.  4.5 5.  5.5]]


In [114]:
# Element-wise multiplication by a scalar
print(a * 2)

[[ 2  4  6  8 10]
 [14 16 18 20 22]]


In [115]:
# Element-wise power: every element is squared
print(a**2)

[[  1   4   9  16  25]
 [ 49  64  81 100 121]]


In [135]:
a = np.array([[1, 2, 3, 4, 5], [7, 8, 9, 10, 11]])
a += 2  # in-place addition: modifies `a` itself rather than creating a new array
print(a)

[[ 3  4  5  6  7]
 [ 9 10 11 12 13]]


In [137]:
# Take cos() of every element (values are interpreted as radians)
b = np.cos(a)
print(b)

[[-0.9899925  -0.65364362  0.28366219  0.96017029  0.75390225]
 [-0.91113026 -0.83907153  0.0044257   0.84385396  0.90744678]]


### Linear Algebra

In [144]:
# Matrix product: (3, 2) @ (2, 3) -> (3, 3); the inner dimensions must match
a = np.full((2,3), fill_value=2)
print(a)
b = np.full((3,2), fill_value=3)
print(b)
c = b @ a  # for 2-D arrays the @ operator is equivalent to np.matmul
print(c)

[[2 2 2]
 [2 2 2]]
[[3 3]
 [3 3]
 [3 3]]
[[12 12 12]
 [12 12 12]
 [12 12 12]]


In [147]:
# Determinant (the identity matrix has determinant 1)
I = np.identity(5)
print(np.linalg.det(I))

1.0


More on: https://numpy.org/doc/stable/reference/routines.linalg.html

## Statistics

In [155]:
a = np.array([[1, 2, 3, 4, 5], [7, 8, 9, 10, 11]])
print(np.min(a))            # smallest value in the whole array
print(np.max(a))            # largest value in the whole array
print(np.min(a, axis = 0))  # minimum of each column
print(np.min(a, axis = 1))  # minimum of each row

1
11
[1 2 3 4 5]
[1 7]


In [158]:
# Sum of each row (axis=1 collapses the columns)
print(np.sum(a, axis = 1))

[15 45]


In [160]:
# Mean of all elements (no axis given, so the whole array is used)
print(np.mean(a))

6.0


In [162]:
# Median of each row
print(np.median(a, axis = 1))

[3. 9.]


## Reorganising Arrays

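Dimensions are important: a reshaped array must contain exactly the same number of elements as the original, and stacked arrays must have compatible sizes.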

In [164]:
# Original array: 2 rows x 5 columns = 10 elements
before = np.array([[1, 2, 3, 4, 5], [7, 8, 9, 10, 11]])
print(before)
print(before.shape)

[[ 1  2  3  4  5]
 [ 7  8  9 10 11]]
(2, 5)


In [168]:
# Change it to 5 rows x 2 columns; the element count (10) must stay the same
after = before.reshape(5, 2)
print(after)

[[ 1  2]
 [ 3  4]
 [ 5  7]
 [ 8  9]
 [10 11]]


In [171]:
# Vertically Stacking
v1 = np.array([1, 2, 3])
v2 = np.array([4, 5, 6])
# Any number of arrays can be stacked, as long as they all have the same length
vs = np.vstack([v1,v2, v2, v1, v1])
print(vs)

[[1 2 3]
 [4 5 6]
 [4 5 6]
 [1 2 3]
 [1 2 3]]


In [180]:
# Horizontal stacking -> the arrays must have the same number of rows
h1 = np.ones((2,4))
h2 = np.zeros((2,2))

hs = np.hstack([h1,h2])
hs

array([[1., 1., 1., 1., 0., 0.],
       [1., 1., 1., 1., 0., 0.]])

## Miscellaneous

### Load Data from a File

In [189]:
# Parse the comma-separated text file into an array (genfromtxt returns floats by default)
file_data = np.genfromtxt("data.txt", delimiter=",")
# Changing the data type
# NOTE(review): assumes data.txt has no missing fields; genfromtxt would load those as nan - confirm
file_data = file_data.astype("int32")
file_data

array([[  1,  13,  21,  11, 196,  75,   4,   3,  34,   6,   7,   8,   0,
          1,   2,   3,   4,   5],
       [  3,  42,  12,  33, 766,  75,   4,  55,   6,   4,   3,   4,   5,
          6,   7,   0,  11,  12],
       [  1,  22,  33,  11, 999,  11,   2,   1,  78,   0,   1,   2,   9,
          8,   7,   1,  76,  88]])

## Boolean Masking and Advanced Indexing

In [190]:
# Element-wise comparison gives a boolean mask with the same shape as file_data
file_data > 50

array([[False, False, False, False,  True,  True, False, False, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False,  True,  True, False,  True, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False,  True, False, False, False,  True,
        False, False, False, False, False, False, False,  True,  True]])

In [191]:
# Indexing with the mask returns the matching values as a flat 1-D array
file_data[file_data > 50]

array([196,  75, 766,  75,  55, 999,  78,  76,  88])

In [192]:
# We can index with a list of positions in NumPy (negative positions count from the end)
a = np.array([1, 2, 3, 4, 5, 6, 7, 8, 9])
a[[1,2,-1]]

array([2, 3, 9])

In [193]:
# axis=0 checks down each column: True if any value in that column is greater than 50
np.any(file_data > 50, axis = 0)

array([False, False, False, False,  True,  True, False,  True,  True,
       False, False, False, False, False, False, False,  True,  True])

In [200]:
# axis=0 checks down each column: True only if all values in that column are greater than 50
np.all(file_data > 50, axis = 0)

array([False, False, False, False,  True, False, False, False, False,
       False, False, False, False, False, False, False, False, False])

In [202]:
# axis=1 checks along each row: True if any value in that row is greater than 50
np.any(file_data > 50, axis = 1)

array([ True,  True,  True])

In [206]:
# Combine conditions with & (element-wise AND); each comparison needs its own parentheses
((file_data > 50) & (file_data < 100))

array([[False, False, False, False, False,  True, False, False, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False, False,  True, False,  True, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False, False, False, False, False,  True,
        False, False, False, False, False, False, False,  True,  True]])

In [207]:
# ~ negates the mask element-wise: True where the value is NOT strictly between 50 and 100
(~((file_data > 50) & (file_data < 100)))

array([[ True,  True,  True,  True,  True, False,  True,  True,  True,
         True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True, False,  True, False,  True,
         True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True,  True,  True,  True, False,
         True,  True,  True,  True,  True,  True,  True, False, False]])

![Screenshot%20%282234%29.png](attachment:Screenshot%20%282234%29.png)