# Load in NumPy

In [1]:
import numpy as np

## The Basics

In [3]:
# Build a one-dimensional array from a flat Python list and print it.
a = np.array([1,2,3]) # 1D: a single axis with three elements
print(a)

[1 2 3]


In [4]:
# Build a two-dimensional float array from a list of two equal-length rows and print it.
b = np.array([[9.0,8.0,7.0], [6.0,5.0,4.0]]) # 2D: 2 rows x 3 columns
print(b)

[[9. 8. 7.]
 [6. 5. 4.]]


In [5]:
# Get the number of dimensions (axes) of an array.
a.ndim # the flat vector `a` has one dimension

1

In [6]:
# `b` was built from a list of rows, so it has two dimensions.
b.ndim

2

In [7]:
# Get the shape: a tuple with the length of the array along each axis.
a.shape # a vector has a one-element shape tuple

(3,)

In [8]:
# Two rows by three columns.
b.shape

(2, 3)

In [9]:
# Get the element data type; the integer input given without a dtype came out as int64 in this run.
a.dtype # data type

dtype('int64')

In [10]:
# Specify the data type explicitly when memory efficiency matters.
a = np.array([1,2,3], dtype='int16') # 1D, stored as 16-bit integers
print(a.dtype)

int16


In [11]:
# Get the size of a single element in bytes.
a.itemsize # 2 bytes per int16 element

2

In [13]:
# The float elements of `b` take 8 bytes each in this run.
b.itemsize

8

In [14]:
# Get the total size in bytes: number of elements times bytes per element.
a.size * a.itemsize

6

In [15]:
# The same total in bytes, available directly as an attribute.
a.nbytes

6

## Accessing/Changing specific elements, rows, columns, etc

In [16]:
# Rebind `a` to a 2 x 7 integer matrix for the indexing examples.
a = np.array([[1,2,3,4,5,6,7],[8,9,10,11,12,13,14]])
print(a)

[[ 1  2  3  4  5  6  7]
 [ 8  9 10 11 12 13 14]]


In [17]:
# Two rows, seven columns.
a.shape

(2, 7)

In [19]:
# Get a specific element with [row, column]; both indices start at 0.
a[1, 5] # second row, sixth column

13

In [20]:
a[1, -2] # negative indices count from the end: -2 is the second-to-last column

13

In [21]:
# Get a specific row: fix the row index and take every column with `:`.
a[0, :]

array([1, 2, 3, 4, 5, 6, 7])

In [22]:
# Get a specific column: take every row with `:` and fix the column index.
a[:, 2]

array([ 3, 10])

In [23]:
# Slices take the form [start:end:step]; the end index is exclusive.
a[0, 1:5:2] # columns 1 and 3 of the first row

array([2, 4])

In [24]:
a[0, 1:-1:2] # a negative end also works: every second column from 1 up to, but excluding, the last

array([2, 4, 6])

In [25]:
# Assign to a single element; the array is modified in place.
a[1,5] = 20
print(a)

[[ 1  2  3  4  5  6  7]
 [ 8  9 10 11 12 20 14]]


In [26]:
# Assigning a scalar to a column slice writes that value into every row of the column.
a[:,2] = 5
print(a)

[[ 1  2  5  4  5  6  7]
 [ 8  9  5 11 12 20 14]]


In [27]:
# Assigning a two-element list to the column sets one value per row.
a[:,2] = [1,2]
print(a)

[[ 1  2  1  4  5  6  7]
 [ 8  9  2 11 12 20 14]]


3D example

In [28]:
# Three levels of list nesting give a 2 x 2 x 2 array.
b = np.array([[[1,2],[3,4]],[[5,6],[7,8]]])
print(b)

[[[1 2]
  [3 4]]

 [[5 6]
  [7 8]]]


In [29]:
# Get a specific element, working from the outermost axis inward.
b[0, 1, 1] # first block, second row, second column

4

In [30]:
# Second row of the first block.
b[0,1,:]

array([3, 4])

In [31]:
# Second row of every block.
b[:,1,:]

array([[3, 4],
       [7, 8]])

In [32]:
# Replace the second row of each block; the right-hand side is 2 x 2, like the selected slice.
b[:,1,:] = [[9,9],[8,8]]
print(b)

[[[1 2]
  [9 9]]

 [[5 6]
  [8 8]]]


## Initializing Different Types of Arrays

In [33]:
# All-zeros array; a single integer gives a 1D array of that length (floats by default).
np.zeros(5)

array([0., 0., 0., 0., 0.])

In [34]:
# A shape tuple gives a 2 x 3 matrix of zeros.
np.zeros((2,3))

array([[0., 0., 0.],
       [0., 0., 0.]])

In [35]:
# A longer shape tuple adds dimensions: two blocks of 3 x 3 zeros.
np.zeros((2,3,3))

array([[[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]],

       [[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]]])

In [37]:
# All-ones array of shape (4, 2, 2), stored as 32-bit integers because a dtype is given.
np.ones((4,2,2), dtype='int32')

array([[[1, 1],
        [1, 1]],

       [[1, 1],
        [1, 1]],

       [[1, 1],
        [1, 1]],

       [[1, 1],
        [1, 1]]], dtype=int32)

In [39]:
# Fill an array with any other constant value.
np.full((2,2), 99, dtype='float32') # arguments: shape, fill value

array([[99., 99.],
       [99., 99.]], dtype=float32)

In [40]:
# full_like builds an array with the shape of an existing array, filled with one value.
a = np.array([[1,2,3,4,5,6,7],[8,9,10,11,12,13,14]])
np.full_like(a, 4)

array([[4, 4, 4, 4, 4, 4, 4],
       [4, 4, 4, 4, 4, 4, 4]])

In [41]:
# Random decimal numbers between 0 and 1; no seed is set, so the values differ on every run.
np.random.rand(4,2) # dimensions are passed as separate arguments, not as a tuple

array([[0.38965391, 0.58368979],
       [0.86804978, 0.77532409],
       [0.03702242, 0.04016638],
       [0.46555065, 0.44190141]])

In [42]:
# The same call with three dimension arguments gives a 4 x 2 x 3 array.
np.random.rand(4,2,3)

array([[[0.73461323, 0.2090606 , 0.06536618],
        [0.61523785, 0.39469707, 0.73055055]],

       [[0.78983593, 0.72629261, 0.0175403 ],
        [0.80702904, 0.32091303, 0.71303317]],

       [[0.43062344, 0.08292238, 0.3192065 ],
        [0.21817597, 0.701315  , 0.84001233]],

       [[0.04679349, 0.46187116, 0.57887958],
        [0.08434786, 0.17660624, 0.71195929]]])

In [43]:
# random_sample takes the shape as a tuple, so an existing array's shape can be passed directly.
np.random.random_sample(a.shape)

array([[0.27738736, 0.63411356, 0.85400852, 0.64689165, 0.14832233,
        0.54362615, 0.42984819],
       [0.55338422, 0.3796881 , 0.8735173 , 0.15349586, 0.49152942,
        0.679417  , 0.22652824]])

In [44]:
# Random integer value; with a single argument the range starts at 0 and the argument is the exclusive upper bound.
np.random.randint(7)

6

In [45]:
# `size` sets the shape of the returned array of random integers.
np.random.randint(7, size=(3,3))

array([[1, 3, 6],
       [6, 4, 4],
       [5, 1, 5]])

In [46]:
# Two positional arguments give a lower and an upper bound; the upper bound is exclusive.
np.random.randint(4, 7, size=(3,3)) # random integers from 4 up to, but not including, 7 (i.e. 4, 5 or 6)

array([[6, 6, 4],
       [5, 4, 5],
       [5, 5, 4]])

In [47]:
# The identity matrix: ones on the diagonal, zeros everywhere else.
np.identity(3) 

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

In [48]:
# Repeat each element of a 1D array three times, keeping the elements in order.
arr = np.array([1,2,3])
r1 = np.repeat(arr,3)
print(r1)

[1 1 1 2 2 2 3 3 3]


In [49]:
# With a 1 x 3 input, repeating along axis 0 duplicates the whole row three times.
arr = np.array([[1,2,3]])
r1 = np.repeat(arr,3, axis=0) # axis 0: repeat along the rows
print(r1)

[[1 2 3]
 [1 2 3]
 [1 2 3]]


In [51]:
# With the same 1 x 3 input, repeating along axis 1 duplicates each element within the single row.
arr = np.array([[1,2,3]])
r1 = np.repeat(arr,3, axis=1) # axis 1: repeat along the columns
print(r1)

[[1 1 1 2 2 2 3 3 3]]


In [56]:
# Frame of int8 ones around a zeroed 3 x 3 interior whose centre is set to 9.
task = np.ones(shape=(5, 5), dtype=np.int8)
task[1:-1, 1:-1] = 0  # everything except the outermost ring
task[2][2] = 9        # centre cell
print(task)

[[1 1 1 1 1]
 [1 0 0 0 1]
 [1 0 9 0 1]
 [1 0 0 0 1]
 [1 1 1 1 1]]


In [58]:
# 5 x 5 float canvas of ones, printed before its interior is overwritten.
output = np.ones(shape=(5, 5))
print(output)

# 3 x 3 block of zeros whose centre element is 9.
z = np.zeros(shape=(3, 3))
z[1][1] = 9
print(z)

# Drop the block into the canvas, leaving the outermost ring of ones untouched.
output[1:4, 1:4] = z
print(output)

[[1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]
 [1. 1. 1. 1. 1.]]
[[0. 0. 0.]
 [0. 9. 0.]
 [0. 0. 0.]]
[[1. 1. 1. 1. 1.]
 [1. 0. 0. 0. 1.]
 [1. 0. 9. 0. 1.]
 [1. 0. 0. 0. 1.]
 [1. 1. 1. 1. 1.]]


##### Be careful when copying arrays!

In [59]:
# Start from a fresh 1D array for the aliasing-versus-copying examples.
a = np.array([1,2,3])
print(a)

[1 2 3]


In [60]:
# Plain assignment does NOT copy: `b` becomes a second name for the same array.
b = a # both names point at exactly the same data
print(b)

[1 2 3]


In [61]:
# `b` is only another name for `a` (from `b = a`), so writing through `b` changes `a` as well.
b[0] = 100
print("a:",a)
print("b:",b)

a: [100   2   3]
b: [100   2   3]


In [62]:
# .copy() creates an independent array, so changing `b` leaves `a` untouched.
b = a.copy()
b[0] = 200
print("a:",a)
print("b:",b)

a: [100   2   3]
b: [200   2   3]


## Mathematics

In [63]:
# Rebind `a` to a small integer vector for the arithmetic examples.
a = np.array([1,2,3,4])
print(a)

[1 2 3 4]


In [64]:
# Arithmetic with a scalar is applied to every element; the result is a new array.
a + 2

array([3, 4, 5, 6])

In [65]:
# Element-wise subtraction of a scalar.
a - 2

array([-1,  0,  1,  2])

In [66]:
# Element-wise multiplication by a scalar.
a * 2

array([2, 4, 6, 8])

In [67]:
# Element-wise division; the result is a float array even though `a` holds integers.
a / 2

array([0.5, 1. , 1.5, 2. ])

In [69]:
# Adding two arrays of the same length works element by element.
b = np.array([1,0,1,0])
a + b

array([2, 2, 4, 4])

In [70]:
# Element-wise power: each element squared.
a ** 2

array([ 1,  4,  9, 16])

In [71]:
# Take the sine of each element (the inputs are interpreted as radians).
np.sin(a)

array([ 0.84147098,  0.90929743,  0.14112001, -0.7568025 ])

In [72]:
# Cosine of each element.
np.cos(a)

array([ 0.54030231, -0.41614684, -0.9899925 , -0.65364362])

##### Linear Algebra

In [73]:
# Two operands for the linear-algebra examples: a (2, 3) array of ones and a
# (3, 2) array filled with 2.
a = np.ones((2,3))
print(a)

b = np.full((3,2), 2)
print(b)

# `*` multiplies element by element, so a (2, 3) array and a (3, 2) array cannot
# be combined this way. Catch the resulting ValueError and print its message so
# the failure is demonstrated without stopping a Restart & Run All; the matrix
# product of these two arrays is computed with np.matmul instead.
try:
    a * b
except ValueError as err:
    print("a * b failed:", err)

[[1. 1. 1.]
 [1. 1. 1.]]
[[2 2]
 [2 2]
 [2 2]]


In [74]:
# Matrix product of the (2, 3) array `a` and the (3, 2) array `b`; the result is (2, 2).
np.matmul(a,b)

array([[6., 6.],
       [6., 6.]])

In [76]:
# Find the determinant; for the 3 x 3 identity matrix it is 1.0.
c = np.identity(3)
np.linalg.det(c)

1.0

In [77]:
# Other things you can do with linalg:
# trace, SVD, eigenvalues, norm, inverse, etc.

##### Statistics

In [78]:
# 2 x 3 sample matrix for the statistics examples.
stats = np.array([[1,2,3],[4,5,6]])
stats

array([[1, 2, 3],
       [4, 5, 6]])

In [79]:
# Minimum over all elements.
np.min(stats)

1

In [82]:
# axis=0 collapses the rows: the minimum of each column.
np.min(stats, axis=0)

array([1, 2, 3])

In [83]:
# axis=1 collapses the columns: the minimum of each row.
np.min(stats, axis=1)

array([1, 4])

In [80]:
# Maximum over all elements.
np.max(stats)

6

In [84]:
# Sum of all elements.
np.sum(stats)

21

In [85]:
# Column sums (axis=0 adds down the rows).
np.sum(stats, axis=0)

array([5, 7, 9])

In [86]:
# Row sums (axis=1 adds across the columns).
np.sum(stats, axis=1)

array([ 6, 15])

## Reorganizing Arrays

In [87]:
# 2 x 4 matrix used as the input for the reshape examples.
before = np.array([[1,2,3,4],[5,6,7,8]])
print(before)

[[1 2 3 4]
 [5 6 7 8]]


In [88]:
# Reshape to 8 rows of 1 column; the eight elements keep their order.
after = before.reshape((8,1))
print(after)

[[1]
 [2]
 [3]
 [4]
 [5]
 [6]
 [7]
 [8]]


In [89]:
# The same eight elements arranged as 4 rows of 2.
after = before.reshape((4,2))
print(after)

[[1 2]
 [3 4]
 [5 6]
 [7 8]]


In [90]:
# Reshaping can also add a dimension: two blocks of 2 x 2.
after = before.reshape((2,2,2))
print(after)

[[[1 2]
  [3 4]]

 [[5 6]
  [7 8]]]


In [91]:
# Stack two length-4 vectors on top of each other, giving a 2 x 4 matrix.
v1 = np.arange(1, 5)   # 1, 2, 3, 4
v2 = np.arange(5, 9)   # 5, 6, 7, 8

np.vstack((v1, v2))

array([[1, 2, 3, 4],
       [5, 6, 7, 8]])

In [92]:
# More than two arrays can be stacked; each vector becomes one row of the result.
np.vstack([v1,v2,v1,v2])

array([[1, 2, 3, 4],
       [5, 6, 7, 8],
       [1, 2, 3, 4],
       [5, 6, 7, 8]])

In [93]:
# Horizontally stacking matrices: a 2 x 4 block of ones next to a 2 x 2 block of zeros.
h1 = np.ones((2,4))
h2 = np.zeros((2,2))

# Both inputs have two rows, so they are joined side by side into a 2 x 6 result.
np.hstack((h1, h2))

array([[1., 1., 1., 1., 0., 0.],
       [1., 1., 1., 1., 0., 0.]])

## Miscellaneous

##### Load Data from File

In [95]:
# Read the comma-separated values in data.txt (path relative to the working directory)
# into an array; the values are loaded as floats.
filedata = np.genfromtxt('data.txt', delimiter=',')
print(filedata)

[[  1.  13.  21.  11. 196.  75.   4.   3.  34.   6.   7.   8.   0.   1.
    2.   3.   4.   5.]
 [  3.  42.  12.  33. 766.  75.   4.  55.   6.   4.   3.   4.   5.   6.
    7.   0.  11.  12.]
 [  1.  22.  33.  11. 999.  11.   2.   1.  78.   0.   1.   2.   9.   8.
    7.   1.  76.  88.]]


In [96]:
# astype returns a converted copy; assign the result if the integer version is needed later.
filedata.astype('int32') # copy (filedata itself is not changed)

array([[  1,  13,  21,  11, 196,  75,   4,   3,  34,   6,   7,   8,   0,
          1,   2,   3,   4,   5],
       [  3,  42,  12,  33, 766,  75,   4,  55,   6,   4,   3,   4,   5,
          6,   7,   0,  11,  12],
       [  1,  22,  33,  11, 999,  11,   2,   1,  78,   0,   1,   2,   9,
          8,   7,   1,  76,  88]], dtype=int32)

##### Boolean Masking and Advanced Indexing

In [97]:
# Comparing an array with a scalar gives a boolean array of the same shape.
filedata > 50

array([[False, False, False, False,  True,  True, False, False, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False,  True,  True, False,  True, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False,  True, False, False, False,  True,
        False, False, False, False, False, False, False,  True,  True]])

In [98]:
# Indexing with the boolean mask keeps only the elements where it is True, as a 1D array.
filedata[filedata > 50]

array([196.,  75., 766.,  75.,  55., 999.,  78.,  76.,  88.])

In [99]:
# You can index with a list of integer positions in NumPy.
a = np.array([1,2,3,4,5,6,7,8,9])
a[[1,2,8]] # picks the elements at positions 1, 2 and 8

array([2, 3, 9])

In [100]:
# For each column: is any value greater than 50?
np.any(filedata > 50, axis=0)

array([False, False, False, False,  True,  True, False,  True,  True,
       False, False, False, False, False, False, False,  True,  True])

In [101]:
# For each row: is any value greater than 50?
np.any(filedata > 50, axis=1)

array([ True,  True,  True])

In [103]:
# For each column: are all values greater than 50?
np.all(filedata > 50, axis=0)

array([False, False, False, False,  True, False, False, False, False,
       False, False, False, False, False, False, False, False, False])

In [104]:
# Combine two conditions element-wise with `&`: True where a value is greater than 50 and less than 100.
((filedata > 50) & (filedata < 100))

array([[False, False, False, False, False,  True, False, False, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False, False,  True, False,  True, False,
        False, False, False, False, False, False, False, False, False],
       [False, False, False, False, False, False, False, False,  True,
        False, False, False, False, False, False, False,  True,  True]])

In [105]:
# `~` negates the mask: True where a value is NOT strictly between 50 and 100.
(~((filedata > 50) & (filedata < 100)))

array([[ True,  True,  True,  True,  True, False,  True,  True,  True,
         True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True, False,  True, False,  True,
         True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True,  True,  True,  True, False,
         True,  True,  True,  True,  True,  True,  True, False, False]])

In [106]:
# 6 x 5 matrix holding the integers 1 through 30 in row-major order.
task2 = np.arange(1, 31).reshape(6, 5)
print(task2)

[[ 1  2  3  4  5]
 [ 6  7  8  9 10]
 [11 12 13 14 15]
 [16 17 18 19 20]
 [21 22 23 24 25]
 [26 27 28 29 30]]


In [107]:
# Rows 2-3 and columns 0-1 (slice ends are exclusive).
task2[2:4, 0:2]

array([[11, 12],
       [16, 17]])

In [108]:
# Paired index lists pick one element per (row, column) pair: (0,1), (1,2), (2,3), (3,4).
task2[[0,1,2,3],[1,2,3,4]]

array([ 2,  8, 14, 20])

In [109]:
# A row index list combined with a column slice: the first and the last two rows, columns 3 onward.
task2[[0,-2,-1],3:]

array([[ 4,  5],
       [24, 25],
       [29, 30]])