In [1]:
import numpy as np

## The Basics

In [2]:
a = np.array([1, 2, 3])
a

array([1, 2, 3])

In [6]:
b = np.array([[1, 2, 3], [4, 5, 6]])
b

array([[1, 2, 3],
       [4, 5, 6]])

In [7]:
# Get dimension
a.ndim, b.ndim

(1, 2)

In [10]:
# Get Shape
a.shape, b.shape

((3,), (2, 3))

In [11]:
# Get Type
a.dtype, b.dtype

(dtype('int64'), dtype('int64'))

In [12]:
# Get item size (bytes per element)
a.itemsize, b.itemsize

(8, 8)

In [13]:
# Get total number of elements
a.size, b.size

(3, 6)

In [14]:
# Get total number of bytes (size * itemsize)
a.nbytes, b.nbytes

(24, 48)

## Accessing/Changing specific elements, rows, columns, etc

In [15]:
c = np.array([[1, 2, 3, 4, 5, 6, 7], [8, 9, 10, 11, 12, 13, 14]])
c

array([[ 1,  2,  3,  4,  5,  6,  7],
       [ 8,  9, 10, 11, 12, 13, 14]])

In [16]:
c.shape

(2, 7)

In [19]:
# Get a specific element [r, c]
c[1, 5]

13

In [20]:
# Using negative index
c[1, -2]

13

In [21]:
# Get a specific row
c[0, :]

array([1, 2, 3, 4, 5, 6, 7])

In [22]:
# Get a specific column
c[:, 0]

array([1, 8])

In [23]:
# More fancy way of getting the elements [rowNumber, startIndex:endIndex:stepSize]
c[0, 1:6:2]

array([2, 4, 6])

In [25]:
# Using negative index
c[0, 1:-1:2]

array([2, 4, 6])

In [26]:
# Changing the value of an element
c[1, 5] = 20
c

array([[ 1,  2,  3,  4,  5,  6,  7],
       [ 8,  9, 10, 11, 12, 20, 14]])

In [27]:
# Changing the value of a series of elements (same value for all).
c[:, 5] = 20
c

array([[ 1,  2,  3,  4,  5, 20,  7],
       [ 8,  9, 10, 11, 12, 20, 14]])

In [28]:
# Changing the value of a series of elements (different values). Make sure the shape of the new values matches the selection.
c[:, 5] = [30, 40]
c

array([[ 1,  2,  3,  4,  5, 30,  7],
       [ 8,  9, 10, 11, 12, 40, 14]])

In [29]:
## 3D - Example

In [31]:
d = np.array(
    [
        [
            [1, 2, 3, 4, 5, 6, 7], 
            [8, 9, 10, 11, 12, 13, 14]
        ], 
        [
            [15, 16, 17, 18, 19, 20, 21], 
            [22, 23, 24, 25, 26, 27, 28]
        ]
    ]
)
d

array([[[ 1,  2,  3,  4,  5,  6,  7],
        [ 8,  9, 10, 11, 12, 13, 14]],

       [[15, 16, 17, 18, 19, 20, 21],
        [22, 23, 24, 25, 26, 27, 28]]])

In [32]:
# Get specific element, suggestion is to work outside in
d[0, 1, 4]

12

In [33]:
# Fancy way: use slices to take index 4 of every row in every block
d[:, :, 4]

array([[ 5, 12],
       [19, 26]])

In [35]:
# Changing the value of a series of elements (different values). Make sure the shape of the new values matches the selection.
d[:, :, 4] = [[50, 50], [60, 60]]
d

array([[[ 1,  2,  3,  4, 50,  6,  7],
        [ 8,  9, 10, 11, 50, 13, 14]],

       [[15, 16, 17, 18, 60, 20, 21],
        [22, 23, 24, 25, 60, 27, 28]]])

## Initializing Different Types of array

In [36]:
# All Zeroes Matrix
np.zeros(5)

array([0., 0., 0., 0., 0.])

In [37]:
# Different shape. 2D
np.zeros([2, 3])

array([[0., 0., 0.],
       [0., 0., 0.]])

In [38]:
# Different shape. 3D
np.zeros([2, 3, 3])

array([[[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]],

       [[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]]])

In [39]:
# Different shape. 4D
np.zeros([2, 3, 3, 3])

array([[[[0., 0., 0.],
         [0., 0., 0.],
         [0., 0., 0.]],

        [[0., 0., 0.],
         [0., 0., 0.],
         [0., 0., 0.]],

        [[0., 0., 0.],
         [0., 0., 0.],
         [0., 0., 0.]]],


       [[[0., 0., 0.],
         [0., 0., 0.],
         [0., 0., 0.]],

        [[0., 0., 0.],
         [0., 0., 0.],
         [0., 0., 0.]],

        [[0., 0., 0.],
         [0., 0., 0.],
         [0., 0., 0.]]]])

In [40]:
# All 1s matrix
np.ones(5)

array([1., 1., 1., 1., 1.])

In [41]:
# Any other number. Takes the shape and then the fill value
np.full((2, 2), 100)


array([[100, 100],
       [100, 100]])

In [43]:
# Also, can use full_like to copy the shape of an existing array.
# Only the shape (and dtype) is copied. The fill value needs to be provided
np.full_like(b, 4)

array([[4, 4, 4],
       [4, 4, 4]])

In [47]:
# Random decimal numbers
np.random.rand(4, 2, 3)

array([[[0.19674391, 0.39671667, 0.4197725 ],
        [0.88672755, 0.87347619, 0.8047329 ]],

       [[0.82459488, 0.20422025, 0.82591045],
        [0.11956916, 0.96714263, 0.85773225]],

       [[0.31647841, 0.34986361, 0.86283729],
        [0.70560232, 0.49492449, 0.08806503]],

       [[0.47031174, 0.340756  , 0.33057654],
        [0.69923152, 0.55336543, 0.47783711]]])

In [49]:
# Random decimal numbers with shape
np.random.random_sample(b.shape)

array([[0.140705  , 0.27831557, 0.33548438],
       [0.13931402, 0.31929854, 0.60832968]])

In [50]:
# Random integer numbers
np.random.randint(100, size=(3, 3))

array([[37, 63, 29],
       [12,  8, 99],
       [93, 12, 41]])

In [51]:
# Identity matrix. By nature is a square matrix
np.identity(5)

array([[1., 0., 0., 0., 0.],
       [0., 1., 0., 0., 0.],
       [0., 0., 1., 0., 0.],
       [0., 0., 0., 1., 0.],
       [0., 0., 0., 0., 1.]])

In [58]:
# Repeating the elements of an array. Takes the array and the number of times to repeat each element (the result is flattened when no axis is given).
np.repeat(b, 3)

array([1, 1, 1, 2, 2, 2, 3, 3, 3, 4, 4, 4, 5, 5, 5, 6, 6, 6])

In [59]:
# Also can provide an axis to repeat on.
np.repeat(b, 3, axis=1)

array([[1, 1, 1, 2, 2, 2, 3, 3, 3],
       [4, 4, 4, 5, 5, 5, 6, 6, 6]])

## Array manipulation

In [61]:
output = np.ones((5, 5))
output

array([[1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.],
       [1., 1., 1., 1., 1.]])

In [65]:
z = np.zeros((3, 3))
z[1, 1] = 9
z

array([[0., 0., 0.],
       [0., 9., 0.],
       [0., 0., 0.]])

In [66]:
output[1:4, 1:4] = z
output

array([[1., 1., 1., 1., 1.],
       [1., 0., 0., 0., 1.],
       [1., 0., 9., 0., 1.],
       [1., 0., 0., 0., 1.],
       [1., 1., 1., 1., 1.]])

In [67]:
output[1:-1, 1:-1] = z
output

array([[1., 1., 1., 1., 1.],
       [1., 0., 0., 0., 1.],
       [1., 0., 9., 0., 1.],
       [1., 0., 0., 0., 1.],
       [1., 1., 1., 1., 1.]])

## Be careful when copying an array. 

In [68]:
# Here b = a only makes "b" another name for the same array as "a". Any change made through "b" will also change "a"
b = a

In [69]:
# To avoid it use "copy"
b = a.copy()

## Mathematics

In [77]:
e = np.array([1, 2, 3, 4])
e

array([1, 2, 3, 4])

In [78]:
# Add
e + 2

array([3, 4, 5, 6])

In [79]:
# Subtract
e - 2

array([-1,  0,  1,  2])

In [80]:
# Multiply
e * 2

array([2, 4, 6, 8])

In [81]:
# Divide
e / 2

array([0.5, 1. , 1.5, 2. ])

In [88]:
# Power
e ** 2

array([ 1,  4,  9, 16])

In [94]:
# Take the sin
np.sin(e)

array([ 0.84147098,  0.90929743,  0.14112001, -0.7568025 ])

In [95]:
# Take the cos
np.cos(e)

array([ 0.54030231, -0.41614684, -0.9899925 , -0.65364362])

In [89]:
# Using another array
f = np.array([10, 11, 12, 13])
f

array([10, 11, 12, 13])

In [90]:
e + f

array([11, 13, 15, 17])

In [91]:
f - e

array([9, 9, 9, 9])

In [92]:
e * f

array([10, 22, 36, 52])

In [93]:
e / f

array([0.1       , 0.18181818, 0.25      , 0.30769231])

## Linear Algebra

In [96]:
g = np.ones((2, 3))
g

array([[1., 1., 1.],
       [1., 1., 1.]])

In [97]:
h = np.full((3, 2), 2)
h

array([[2, 2],
       [2, 2],
       [2, 2]])

In [98]:
# Multiplication
np.matmul(g, h)

array([[6., 6.],
       [6., 6.]])

In [100]:
# Find determinant
i = np.identity(3)
np.linalg.det(i)

1.0

In [101]:
## Try other stuff like - 
# Determinant
# Trace
# Singular Value Decomposition
# Eigenvalues
# Matrix Norm
# Inverse
# Etc..

## Statistics

In [102]:
stats = np.array([[1, 2, 3], [4, 5, 6]])
stats

array([[1, 2, 3],
       [4, 5, 6]])

In [103]:
# Minimum
np.min(stats)

1

In [104]:
# Maximum
np.max(stats)

6

In [105]:
# Minimum based on row. Use axis.
np.min(stats, axis=1)

array([1, 4])

In [106]:
# Maximum based on row. Use axis.
np.max(stats, axis=1)

array([3, 6])

In [107]:
# Sum based on row. Use axis.
np.sum(stats, axis=1)

array([ 6, 15])

In [108]:
# Mean
np.mean(stats)

3.5

## Reorganizing Arrays

In [115]:
before = np.array([[1, 2, 3, 4], [5, 6, 7, 8]])
before

array([[1, 2, 3, 4],
       [5, 6, 7, 8]])

In [119]:
after = before.reshape(4, 2)
after

array([[1, 2],
       [3, 4],
       [5, 6],
       [7, 8]])

In [120]:
after = before.reshape(2, 2, 2)
after

array([[[1, 2],
        [3, 4]],

       [[5, 6],
        [7, 8]]])

In [122]:
# Vertically stacking vectors
v1 = np.array([1, 2, 3, 4])
v2 = np.array([5, 6, 6, 8])
v1, v2

(array([1, 2, 3, 4]), array([5, 6, 6, 8]))

In [123]:
np.vstack([v1, v2])

array([[1, 2, 3, 4],
       [5, 6, 6, 8]])

In [124]:
np.vstack([v1, v2, v1, v2])

array([[1, 2, 3, 4],
       [5, 6, 6, 8],
       [1, 2, 3, 4],
       [5, 6, 6, 8]])

In [125]:
# Horizontal stack
np.hstack([v1, v2])

array([1, 2, 3, 4, 5, 6, 6, 8])

In [126]:
np.hstack([v1, v2, v1, v2])

array([1, 2, 3, 4, 5, 6, 6, 8, 1, 2, 3, 4, 5, 6, 6, 8])

## Miscellaneous

In [143]:
# Load comma-separated data from a file into an array
filedata = np.genfromtxt("numpy-example-data", delimiter=",")
print(filedata)

# Same data converted to a different type (32-bit integers)
print(filedata.astype("int32")) # astype returns a new array; filedata itself is not modified

[[ 1.  2.  3.  4. 50.  6.  7.  8.  9.]
 [ 1.  2.  3.  4.  5. 60.  7.  8.  9.]
 [ 1.  2.  3.  4.  5.  6. 70.  8.  9.]]
[[ 1  2  3  4 50  6  7  8  9]
 [ 1  2  3  4  5 60  7  8  9]
 [ 1  2  3  4  5  6 70  8  9]]


## Masking and Advanced Indexing

In [144]:
# Boolean Masking
filedata > 50

array([[False, False, False, False, False, False, False, False, False],
       [False, False, False, False, False,  True, False, False, False],
       [False, False, False, False, False, False,  True, False, False]])

In [145]:
filedata < 50

array([[ True,  True,  True,  True, False,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True, False,  True,  True,  True],
       [ True,  True,  True,  True,  True,  True, False,  True,  True]])

In [146]:
# Find all: per column (axis=0), check whether every value is > 50
np.all(filedata > 50, axis=0)

array([False, False, False, False, False, False, False, False, False])

In [147]:
# Find any: per column (axis=0), check whether at least one value is > 50
np.any(filedata > 50, axis=0)

array([False, False, False, False, False,  True,  True, False, False])

In [148]:
# Find data in-between
((filedata > 50) & (filedata < 100))

array([[False, False, False, False, False, False, False, False, False],
       [False, False, False, False, False,  True, False, False, False],
       [False, False, False, False, False, False,  True, False, False]])

In [149]:
# Find reverse: negate the whole "in-between" mask from the previous cell.
# `~` binds tighter than `&`, so the combined condition needs its own
# parentheses; without them only the first comparison would be inverted.
~((filedata > 50) & (filedata < 100))

array([[ True,  True,  True,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True, False,  True,  True,  True],
       [ True,  True,  True,  True,  True,  True, False,  True,  True]])

In [153]:
# Indexing with a list of row indices (selects rows 1 and 2)
filedata[[1,2]]

array([[ 1.,  2.,  3.,  4.,  5., 60.,  7.,  8.,  9.],
       [ 1.,  2.,  3.,  4.,  5.,  6., 70.,  8.,  9.]])

In [156]:
# Indexing in a range
filedata[0:1,0:2]

array([[1., 2.]])

In [158]:
# Indexing specifics: pairs row indices [0, 1] with column indices [0, 2], i.e. elements [0, 0] and [1, 2]
filedata[[0,1],[0,2]]

array([1., 3.])