# Data Science Basics - Numpy

In [None]:
import numpy as np

## The Basics

In [None]:
a = np.array([1, 2, 3])
a

In [None]:
b = np.array([[1, 2, 3], [4, 5, 6]])
b

In [None]:
# Get dimension
a.ndim, b.ndim

In [None]:
# Get Shape
a.shape, b.shape

In [None]:
# Get Type
a.dtype, b.dtype

In [None]:
# Get item size (bytes per element)
a.itemsize, b.itemsize

In [None]:
# Get total number of elements
a.size, b.size

In [None]:
# Get total number of bytes (size * itemsize)
a.nbytes, b.nbytes

## Accessing/Changing specific elements, rows, columns, etc

In [None]:
c = np.array([[1, 2, 3, 4, 5, 6, 7], [8, 9, 10, 11, 12, 13, 14]])
c

In [None]:
c.shape

In [None]:
# Get a specific element [r, c]
c[1, 5]

In [None]:
# Using negative index
c[1, -2]

In [None]:
# Get a specific row
c[0, :]

In [None]:
# Get a specific column
c[:, 0]

In [None]:
# More fancy way of getting the elements [rowNumber, startIndex:endIndex:stepSize]
c[0, 1:6:2]

In [None]:
# Using negative index
c[0, 1:-1:2]

In [None]:
# Changing the value of an element
c[1, 5] = 20
c

In [None]:
# Changing the value of a series of elements (here a whole column) to the same value.
c[:, 5] = 20
c

In [None]:
# Changing the value of a series of elements to different values. Make sure the shapes match.
c[:, 5] = [30, 40]
c

In [None]:
## 3D - Example

In [None]:
# Two 2x7 blocks stacked along a new leading axis give a 2x2x7 array
block_one = [[1, 2, 3, 4, 5, 6, 7], [8, 9, 10, 11, 12, 13, 14]]
block_two = [[15, 16, 17, 18, 19, 20, 21], [22, 23, 24, 25, 26, 27, 28]]
d = np.array([block_one, block_two])
d

In [None]:
# Get a specific element; the suggestion is to work from the outermost axis inwards
d[0, 1, 4]

In [None]:
# Fancy way: element at index 4 of every row in every block
d[:, :, 4]

In [None]:
# Changing the value of a series of elements to different values. Make sure the shapes match.
d[:, :, 4] = [[50, 50], [60, 60]]
d

## Initializing Different Types of array

In [None]:
# All Zeroes Matrix
np.zeros(5)

In [None]:
# Different shape. 2D
np.zeros([2, 3])

In [None]:
# Different shape. 3D
np.zeros([2, 3, 3])

In [None]:
# Different shape. 4D
np.zeros([2, 3, 3, 3])

In [None]:
# All 1s matrix
np.ones(5)

In [None]:
# Any other number. Takes the shape and then the fill value
np.full((2, 2), 100)

In [None]:
# Also, full_like can be used to reuse the shape (and dtype) of an existing array.
# Only the shape and dtype are taken from it; the fill value still needs to be provided
np.full_like(b, 4)

In [None]:
# Random decimal numbers
np.random.rand(4, 2, 3)

In [None]:
# Random decimal numbers with shape
np.random.random_sample(b.shape)

In [None]:
# Random integer numbers
np.random.randint(100, size=(3, 3))

In [None]:
# Identity matrix. By nature is a square matrix
np.identity(5)

In [None]:
# Repeating an array. Takes the array and the number of times to repeat each element.
# Without an axis the result is a flattened 1D array.
np.repeat(b, 3)

In [None]:
# Also can provide an axis to repeat on.
np.repeat(b, 3, axis=1)

## Array manipulation

In [None]:
# 5x5 canvas filled with ones
output = np.ones(shape=(5, 5))
output

In [None]:
# 3x3 patch of zeros with a single 9 in the middle cell
centre = (1, 1)
z = np.zeros(shape=(3, 3))
z[centre] = 9
z

In [None]:
# Overwrite the inner 3x3 region (rows 1-3, columns 1-3) of output with z
output[1:4, 1:4] = z
output

In [None]:
# Same assignment written with negative stops: 1:-1 skips the first and last row/column
output[1:-1, 1:-1] = z
output

## Be careful when copying an array. 

In [None]:
# Here b = a makes "b" refer to the same array as "a". Any in-place change made through "b" will also change "a"
b = a

In [None]:
# To avoid it use "copy"
b = a.copy()

## Mathematics

In [None]:
e = np.array([1, 2, 3, 4])
e

In [None]:
# Add
e + 2

In [None]:
# Subtract
e - 2

In [None]:
# Multiply
e * 2

In [None]:
# Divide
e / 2

In [None]:
# Power
e ** 2

In [None]:
# Take the sin
np.sin(e)

In [None]:
# Take the cos
np.cos(e)

In [None]:
# Using another array
f = np.array([10, 11, 12, 13])
f

In [None]:
e + f

In [None]:
f - e

In [None]:
e * f

In [None]:
e / f

## Linear Algebra

In [None]:
g = np.ones((2, 3))
g

In [None]:
h = np.full((3, 2), 2)
h

In [None]:
# Multiplication
np.matmul(g, h)

In [None]:
# Find determinant
i = np.identity(3)
np.linalg.det(i)

In [None]:
## Try other stuff like -
# Determinant
# Trace
# Singular Value Decomposition
# Eigenvalues
# Matrix Norm
# Inverse
# Etc..

## Statistics

In [None]:
stats = np.array([[1, 2, 3], [4, 5, 6]])
stats

In [None]:
# Minimum
np.min(stats)

In [None]:
# Maximum
np.max(stats)

In [None]:
# Minimum of each row. Use axis.
np.min(stats, axis=1)

In [None]:
# Maximum of each row. Use axis.
np.max(stats, axis=1)

In [None]:
# Sum of each row. Use axis.
np.sum(stats, axis=1)

In [None]:
# Mean
np.mean(stats)

## Reorganizing Arrays

In [None]:
before = np.array([[1, 2, 3, 4], [5, 6, 7, 8]])
before

In [None]:
# Reshape to 4 rows x 2 columns; the total number of elements (8) must stay the same
after = before.reshape(4, 2)
after

In [None]:
# Reshape to 3D (2 x 2 x 2); still 8 elements in total
after = before.reshape(2, 2, 2)
after

In [None]:
# Vertically stacking vectors
v1 = np.array([1, 2, 3, 4])
v2 = np.array([5, 6, 6, 8])
v1, v2

In [None]:
np.vstack([v1, v2])

In [None]:
np.vstack([v1, v2, v1, v2])

In [None]:
# Horizontal stack
np.hstack([v1, v2])

In [None]:
np.hstack([v1, v2, v1, v2])

## Miscellaneous

In [None]:
# Load comma-separated data from a text file into an array
filedata = np.genfromtxt("data/numpy-example-data", delimiter=",")
print(filedata)

# Convert to a different dtype
print(filedata.astype("int32"))  # astype returns a converted copy; filedata itself is left unchanged

## Masking and Advanced Indexing

In [None]:
# Boolean Masking
filedata > 50

In [None]:
filedata < 50

In [None]:
# Check, column by column, whether all values are > 50 (axis=0 reduces over the rows)
np.all(filedata > 50, axis=0)

In [None]:
# Check, column by column, whether any value is > 50 (axis=0 reduces over the rows)
np.any(filedata > 50, axis=0)

In [None]:
# Find data in-between
((filedata > 50) & (filedata < 100))

In [None]:
# Find reverse: mask of everything that is NOT strictly between 50 and 100.
# The whole in-between mask is parenthesised before negating, because ~ binds
# tighter than & and would otherwise flip only the first comparison.
~((filedata > 50) & (filedata < 100))

In [None]:
# Indexing with a list of row indices (selects rows 1 and 2)
filedata[[1, 2]]

In [None]:
# Indexing in a range
filedata[0:1, 0:2]

In [None]:
# Indexing specific elements: pairs up the lists, picking (row 0, col 0) and (row 1, col 2)
filedata[[0, 1], [0, 2]]