# Learning NumPy
Notebook in accordance with https://youtu.be/GB9ByFAIAH4?t=558 (timestamp: 9:17 - 50:20)
![image.png](attachment:image.png)

In [2]:
import numpy as np

## Basics

In [11]:
a = np.array([1,2,3],dtype='int16')
print(a)

[1 2 3]


In [5]:
b = np.array([[9.0,8.0,7.0],[6.0,5.0,4.0]])
print(b)

[[9. 8. 7.]
 [6. 5. 4.]]


In [6]:
#Get Dimension
a.ndim

1

In [9]:
# Get Shape
b.shape

(2, 3)

In [12]:
# Get Type
a.dtype

dtype('int16')

In [14]:
# Get Size
a.itemsize

2

In [15]:
# No. of items
a.size

3

In [16]:
# Get total size
a.size*a.itemsize #Method-1
a.nbytes          #Method-2

6

In [18]:
a = np.array([1,2,3])
# Get Type
print(a.dtype)
# Get Size
print(a.itemsize)
# No. of items
print(a.size)
# Get total size
print(a.size*a.itemsize) #Method-1
print(a.nbytes)          #Method-2

int32
4
3
12
12


## Accessing/Changing specific elements, rows, columns etc.

In [19]:
a = np.array([[1,2,3,4,5,6,7],[8,9,10,11,12,13,14]])
print(a)

[[ 1  2  3  4  5  6  7]
 [ 8  9 10 11 12 13 14]]


In [20]:
a.shape

(2, 7)

In [23]:
# Get a specific element: var[row,col]
a[1,5]   #With negative notation as a[1,-2]

13

In [24]:
# Get a specific row: var[row, :]
a[0,:]

array([1, 2, 3, 4, 5, 6, 7])

In [25]:
# Get a specific column: var[:, col]
a[:, 2]

array([ 3, 10])

In [26]:
# Slicing: var[row, startindex:endindex:stepsize] || var[startindex:endindex:stepsize, col]
a[0, 1:6:2]  #can also write 6 as -1

array([2, 4, 6])

In [27]:
# To change:
a[1,5]=20
a

array([[ 1,  2,  3,  4,  5,  6,  7],
       [ 8,  9, 10, 11, 12, 20, 14]])

In [28]:
a[:,2]=5
a

array([[ 1,  2,  5,  4,  5,  6,  7],
       [ 8,  9,  5, 11, 12, 20, 14]])

In [29]:
a[:,2]= [1,2]
a

array([[ 1,  2,  1,  4,  5,  6,  7],
       [ 8,  9,  2, 11, 12, 20, 14]])

## 3D Array

In [31]:
b = np.array([[[1,2],[3,4]],[[5,6],[7,8]]])
b

array([[[1, 2],
        [3, 4]],

       [[5, 6],
        [7, 8]]])

In [32]:
# Get specific element: Work outside in
b[0, 1, 1]

4

In [33]:
b[:,1,:]

array([[3, 4],
       [7, 8]])

In [34]:
# Replace
b[:,1,:] = [[9,9],[8,8]]

In [35]:
b

array([[[1, 2],
        [9, 9]],

       [[5, 6],
        [8, 8]]])

# Initializing Different Types of Arrays

In [36]:
# Initializing with zeros: np.zeros(shape)
np.zeros((2,3))

array([[0., 0., 0.],
       [0., 0., 0.]])

In [37]:
# Initializing with ones: np.ones(shape)
np.ones((4,2,2),dtype='int32')

array([[[1, 1],
        [1, 1]],

       [[1, 1],
        [1, 1]],

       [[1, 1],
        [1, 1]],

       [[1, 1],
        [1, 1]]])

In [38]:
# Any other number: np.full(shape, value)
np.full((2,2), 99)

array([[99, 99],
       [99, 99]])

In [41]:
# To reuse existing shape: np.full_like(var, val)
np.full_like(a, 4) # Equivalent to np.full(var.shape, val)

array([[4, 4, 4, 4, 4, 4, 4],
       [4, 4, 4, 4, 4, 4, 4]])

In [44]:
# Random Decimal Nos: np.random.rand(size)
np.random.rand(4,2,3)

array([[[0.06033326, 0.00525855, 0.43887244],
        [0.48884442, 0.60686616, 0.779814  ]],

       [[0.2795797 , 0.00711681, 0.95376401],
        [0.89221216, 0.57073157, 0.88355813]],

       [[0.93785893, 0.85631924, 0.10333679],
        [0.65539395, 0.57266937, 0.64265797]],

       [[0.42141656, 0.96081168, 0.66398241],
        [0.26291709, 0.27861281, 0.38124641]]])

In [45]:
# To reuse existing shape in random: np.random.random_sample(var.shape)
np.random.random_sample(a.shape)

array([[0.03128886, 0.25521201, 0.00417884, 0.21148877, 0.20187151,
        0.62109664, 0.74686523],
       [0.9563695 , 0.97761035, 0.84466685, 0.31871329, 0.50122739,
        0.43267439, 0.19368071]])

In [47]:
# Random Integer Nos: np.random.randint(startvalue, endvalue, size) : Takes startvalue 0 by default; endvalue exclusive
np.random.randint(7, size=(3,3))

array([[3, 0, 3],
       [4, 3, 4],
       [6, 1, 4]])

In [48]:
# Identity Matrix: np.identity(size)
np.identity(3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

In [49]:
# Repeating arrays: np.repeat(arr, no_of_repeatitions, axis)
arr = np.array([[1,2,3]])
r1 = np.repeat(arr,3,axis = 0)

In [50]:
r1

array([[1, 2, 3],
       [1, 2, 3],
       [1, 2, 3]])

## Practice Question:
Create the following array:
$$
\begin{bmatrix} 
1 & 1 & 1 & 1 & 1 \\
1 & 0 & 0 & 0 & 1 \\
1 & 0 & 9 & 0 & 1 \\
1 & 0 & 0 & 0 & 1 \\
1 & 1 & 1 & 1 & 1 \\
\end{bmatrix}
\quad
$$

In [53]:
#Solution
output = np.ones((5,5), dtype='int32')
mid = np.zeros((3,3), dtype='int32')
mid[1,1] = 9
output[1:-1, 1:-1] = mid
print(output)

[[1 1 1 1 1]
 [1 0 0 0 1]
 [1 0 9 0 1]
 [1 0 0 0 1]
 [1 1 1 1 1]]


### Be careful while copying arrays!!

In [54]:
a = np.array([1,2,3])
b = a
print(a,b)

[1 2 3] [1 2 3]


In [55]:
b[0] = 100
print(a,b)

[100   2   3] [100   2   3]


Oops!! The value of 'a' also changed on change in b as b points to same thing as a; not make a copy. So, to prevent this, we use the copy() function.

In [56]:
#Using copy t initialize b
a = np.array([1,2,3])
b = a.copy()
b[0] = 100
print(a)

[1 2 3]


## Mathematics

In [57]:
a = np.array([1,2,3,4])
a

array([1, 2, 3, 4])

In [58]:
a + 2

array([3, 4, 5, 6])

In [59]:
a - 2

array([-1,  0,  1,  2])

In [60]:
a*2

array([2, 4, 6, 8])

In [61]:
a/2

array([0.5, 1. , 1.5, 2. ])

In [62]:
b = np.array([1,0,1,0])
a + b

array([2, 2, 4, 4])

In [63]:
a**2

array([ 1,  4,  9, 16], dtype=int32)

In [64]:
# Take the sin
np.sin(a)

array([ 0.84147098,  0.90929743,  0.14112001, -0.7568025 ])

In [65]:
np.cos(a)

array([ 0.54030231, -0.41614684, -0.9899925 , -0.65364362])

In [66]:
# For a lot more (https://docs.scipy.org/doc/numpy/reference/routines.math.html)

## Linear Algebra

In [67]:
a = np.ones((2,3))
print(a)

b = np.full((3,2), 2)
print(b)

np.matmul(a,b)

[[1. 1. 1.]
 [1. 1. 1.]]
[[2 2]
 [2 2]
 [2 2]]


array([[6., 6.],
       [6., 6.]])

In [68]:
# Find the determinant
c = np.identity(3)
np.linalg.det(c)

1.0

In [69]:
## Reference docs (https://docs.scipy.org/doc/numpy/reference/routines.linalg.html)

# Determinant
# Trace
# Singular Vector Decomposition
# Eigenvalues
# Matrix Norm
# Inverse
# Etc...

## Statistics

In [70]:
stats = np.array([[1,2,3],[4,5,6]])
stats

array([[1, 2, 3],
       [4, 5, 6]])

In [71]:
np.min(stats)

1

In [73]:
np.max(stats, axis=1) # Max of each row(axis=1)

array([3, 6])

In [74]:
np.sum(stats, axis=0)

array([5, 7, 9])

## Reorganizing Arrays

In [77]:
before = np.array([[1,2,3,4],[5,6,7,8]])
print(before)

after = before.reshape((8,1)) # Could also take (4,2) or (2,2,2)
print(after)

[[1 2 3 4]
 [5 6 7 8]]
[[1]
 [2]
 [3]
 [4]
 [5]
 [6]
 [7]
 [8]]


In [78]:
after = before.reshape((2,3))
print(after)

ValueError: cannot reshape array of size 8 into shape (2,3)

In [79]:
# Vertically stacking vectors
v1 = np.array([1,2,3,4])
v2 = np.array([5,6,7,8])

np.vstack([v1,v2,v1,v2])

array([[1, 2, 3, 4],
       [5, 6, 7, 8],
       [1, 2, 3, 4],
       [5, 6, 7, 8]])

In [80]:
# Horizontal  stack
h1 = np.ones((2,4))
h2 = np.zeros((2,2))

np.hstack((h1,h2))

array([[1., 1., 1., 1., 0., 0.],
       [1., 1., 1., 1., 0., 0.]])

## Miscellaneous

### Load Data from File

In [82]:
filedata = np.genfromtxt('data.txt', delimiter=',')
filedata = filedata.astype('int32')
print(filedata)

[[  1  13  21  11 196  75   4   3  34   6   7   8   0   1   2   3   4   5]
 [  3  42  12  33 766  75   4  55   6   4   3   4   5   6   7   0  11  12]
 [  1  22  33  11 999  11   2   1  78   0   1   2   9   8   7   1  76  88]]


### Boolean Masking and Advanced Indexing

In [83]:
(~((filedata > 50) & (filedata < 100)))

array([[ True,  True,  True,  True,  True, False,  True,  True,  True,
         True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True, False,  True, False,  True,
         True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True,  True,  True,  True, False,
         True,  True,  True,  True,  True,  True,  True, False, False]])

----------------------------------------------------------------------------------------------------------------------------

In [3]:
np.arange(7,0,-3)

array([7, 4, 1])

In [4]:
np.flip(np.arange(1, 8, 3))

array([7, 4, 1])

In [9]:
a=np.array([[1,2],[3,4]])

In [10]:
b= a.sum(axis=1)

In [12]:
np.array(['a','b','c'])*2

TypeError: ufunc 'multiply' did not contain a loop with signature matching types dtype('<U3') dtype('<U3') dtype('<U3')