<a href="https://colab.research.google.com/github/sbogde/pandamonium/blob/main/dmi_00_numpy_00.ipynb" target="_parent"><img src="https://colab.research.google.com/assets/colab-badge.svg" alt="Open In Colab"/></a>

## Arrays vs Lists

In [1]:
import numpy as np

In [2]:
L = [1,2,3]

In [3]:
A = np.array([1,2,3])

In [4]:
for e in L:
  print(e)

1
2
3


In [5]:
for e in A:
  print(e)

1
2
3


In [6]:
L.append(4)

In [7]:
L

[1, 2, 3, 4]

In [8]:
# A.append(4)  # doesn't work: NumPy arrays have no .append() method (raises AttributeError)

In [9]:
# A = np.append(A, 5)
# A

In [10]:
L + [5]

[1, 2, 3, 4, 5]

In [11]:
A + np.array([4]) # the same as A + np.array([4, 4, 4])

array([5, 6, 7])

In [12]:
A + np.array([4,5,6])

array([5, 7, 9])

In [13]:
# Doesn't work: shapes (3,) and (2,) cannot be broadcast together, so NumPy
# raises ValueError. The error is caught and printed so that the notebook
# still runs top to bottom (an uncaught exception stops "Run All" here).
try:
  A + np.array([4,5])
except ValueError as err:
  print(f"{type(err).__name__}: {err}")

ValueError: operands could not be broadcast together with shapes (3,) (2,) 

In [None]:
2 * A

In [None]:
2 * L

In [None]:
L + L

In [None]:
# Element-wise "add 3" on a plain list needs an explicit loop:
# build a new list by appending e + 3 for every element e of L.
L2 = []
for e in L:
  L2.append(e + 3)

In [None]:
L2

In [None]:
# Same "add 3 to every element" result, written as a list comprehension.
L2 = [e + 3 for e in L]

In [None]:
L2

In [None]:
# Squaring every element of a list also takes a loop:
# append e**2 for each element e of L.
L2 = []
for e in L:
  L2.append(e**2)

In [None]:
L2

In [None]:
A**2

In [None]:
np.sqrt(A)

In [None]:
np.log(A)

In [None]:
np.exp(A)

In [None]:
np.tanh(A)

## The Dot Product

$$ a \cdot b = a^T b = \sum_{d=1}^D a_d b_d $$

In [14]:
a = np.array([1,2])
b = np.array([3,4])

In [15]:
# Dot product by hand: accumulate the products of paired elements of a and b.
dot = 0
for e, f in zip(a, b):
  dot += e*f
dot

11

In [16]:
# Same dot product, but stepping through positions with an integer index
# instead of zip.
dot = 0
for i in range(len(a)):
  dot += a[i] * b[i]
dot

11

In [17]:
a * b

array([3, 8])

In [18]:
np.sum(a * b)

11

In [19]:
(a * b).sum()

11

In [20]:
np.dot(a, b)

11

In [21]:
a.dot(b)

11

In [22]:
b.dot(a)

11

In [23]:
a @ b

11

$$ a^T b = \left\lVert a \right\rVert \left\lVert b \right\rVert \cos \theta_{ab}$$

$$ \cos \theta_{ab} = \frac{a^T b}{\left\lVert a \right\rVert \left\lVert b \right\rVert} $$

$$ \left\lVert a \right\rVert = \sqrt{\sum_{d=1}^D a_d^2 } $$

In [24]:
amag = np.sqrt((a * a).sum())
amag

2.23606797749979

In [25]:
# Magnitude of the vector `a` using NumPy's built-in norm. The norm must be
# taken of `a` itself, not of the scalar magnitude computed by hand in the
# previous cell; the result should agree with that manual value.
amag = np.linalg.norm(a)
amag

2.23606797749979

In [26]:
cosangle = a.dot(b) / (np.linalg.norm(a) * np.linalg.norm(b))

In [27]:
cosangle

0.9838699100999074

In [28]:
angle = np.arccos(cosangle)
angle

0.17985349979247847

## Speed Test

In [32]:
## speed comparison ##
import numpy as np
from datetime import datetime

# note: you can also use %timeit

# Inputs for the benchmark: two random length-100 vectors and the number of
# times (T) each implementation is called.
a = np.random.randn(100)
b = np.random.randn(100)
T = 100000

def slow_dot_product(a, b):
  """Return the dot product of `a` and `b` computed with a plain Python loop.

  Elements are paired with zip, so iteration stops at the shorter input and
  two empty inputs give 0. This is intentionally unvectorized: it serves as
  the slow baseline that NumPy's dot is timed against.
  """
  total = 0
  paired = zip(a, b)
  for left, right in paired:
    total += left * right
  return total

# Time T calls of the pure-Python loop implementation.
t0 = datetime.now()
for t in range(T):
  slow_dot_product(a, b)
dt1 = datetime.now() - t0

# Time T calls of NumPy's built-in dot on the same vectors.
t0 = datetime.now()
for t in range(T):
  a.dot(b)
dt2 = datetime.now() - t0

# Ratio of elapsed times: a value above 1 means the Python loop took longer.
print("dt1 / dt2:", dt1.total_seconds() / dt2.total_seconds())

dt1 / dt2: 54.0816793680038


## Matrices

In [33]:
L = [[1,2], [3,4]]
L

[[1, 2], [3, 4]]

In [34]:
L[0]

[1, 2]

In [35]:
L[0][1]

2

In [37]:
A = np.array([[1,2], [3,4]])
A

array([[1, 2],
       [3, 4]])

In [38]:
A[0][1]

2

In [39]:
A[0,1]

2

In [40]:
A[:,0]

array([1, 3])

In [41]:
A.T

array([[1, 3],
       [2, 4]])

In [42]:
np.exp(A)

array([[ 2.71828183,  7.3890561 ],
       [20.08553692, 54.59815003]])

In [43]:
np.exp(L)

array([[ 2.71828183,  7.3890561 ],
       [20.08553692, 54.59815003]])

In [44]:
B = np.array([[1,2,3],[4,5,6]])
B

array([[1, 2, 3],
       [4, 5, 6]])

In [45]:
A.dot(B)

array([[ 9, 12, 15],
       [19, 26, 33]])

In [46]:
# Error demo: inner dimensions must match. A is (2,2) and B.T is (3,2), so the
# product is undefined and NumPy raises ValueError. The error is caught and
# printed so the notebook still runs top to bottom.
try:
  A.dot(B.T)
except ValueError as err:
  print(f"{type(err).__name__}: {err}")

ValueError: shapes (2,2) and (3,2) not aligned: 2 (dim 1) != 3 (dim 0)

In [48]:
np.linalg.det(A)

-2.0000000000000004

In [49]:
np.linalg.inv(A)

array([[-2. ,  1. ],
       [ 1.5, -0.5]])

In [50]:
np.linalg.inv(A).dot(A)

array([[1.00000000e+00, 0.00000000e+00],
       [1.11022302e-16, 1.00000000e+00]])

In [51]:
np.trace(A)

5

In [52]:
np.diag(A)

array([1, 4])

In [53]:
np.diag([1, 4])

array([[1, 0],
       [0, 4]])

In [54]:
np.linalg.eig(A)

EigResult(eigenvalues=array([-0.37228132,  5.37228132]), eigenvectors=array([[-0.82456484, -0.41597356],
       [ 0.56576746, -0.90937671]]))

In [56]:
Lam, V = np.linalg.eig(A)

In [57]:
# Exact == on floating-point results: rounding error can make mathematically
# equal values differ in their last bits, so some entries may compare False.
V[:,0] * Lam[0] == A @ V[:,0]

array([ True, False])

In [58]:
V[:,0] * Lam[0], A @ V[:,0]

(array([ 0.30697009, -0.21062466]), array([ 0.30697009, -0.21062466]))

In [59]:
np.allclose(V[:,0] * Lam[0], A @ V[:,0])

True

In [None]:
np.allclose(V @ np.diag(Lam), A @ V)

## Solving Linear Systems

The admission fee at a small fair is \$1.50 for children and \$4 for adults.
On a certain day, 2200 people enter the fair and \$5,050 is collected.
How many children and how many adults attended? 🤔

In [60]:
A = np.array([[1, 1], [1.5, 4]])
b = np.array([2200, 5050])

In [61]:
np.linalg.solve(A, b)

array([1500.,  700.])

In [62]:
# don't do this: forming the inverse explicitly is slower and less numerically accurate than np.linalg.solve(A, b)
np.linalg.inv(A).dot(b)

array([1500.,  700.])

## Generating Data

In [63]:
np.zeros((2, 3))

array([[0., 0., 0.],
       [0., 0., 0.]])

In [64]:
np.ones((2, 3))

array([[1., 1., 1.],
       [1., 1., 1.]])

In [65]:
10 * np.ones((2, 3))

array([[10., 10., 10.],
       [10., 10., 10.]])

In [66]:
np.eye(3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

In [71]:
np.random.random()

0.6175568205154296

In [70]:
np.random.random((2, 3))

array([[0.92091954, 0.145741  , 0.59014316],
       [0.44266479, 0.85399735, 0.15597391]])

In [72]:
np.random.randn(2, 3)

array([[-0.80173426, -0.80784134,  1.25394236],
       [ 0.15905036,  1.95280769,  0.89519751]])

In [82]:
R = np.random.randn(10000)

In [83]:
R.mean()

-0.017621574749605007

In [84]:
np.mean(R)

-0.017621574749605007

In [85]:
R.var()

1.016285465208725

In [86]:
R = np.random.randn(10000, 3)

In [87]:
R.mean(axis=0)

array([-0.00086677, -0.00886433, -0.01101792])

In [88]:
R.mean(axis=1).shape

(10000,)

In [89]:
# Gotcha: with the default rowvar=True, np.cov treats each row of R as a
# variable, so the (10000, 3) array yields a 10000 x 10000 matrix.
np.cov(R).shape

(10000, 10000)

In [90]:
np.cov(R.T)

array([[ 1.00663697, -0.00401198,  0.01841455],
       [-0.00401198,  0.99468023,  0.00404738],
       [ 0.01841455,  0.00404738,  1.00467069]])

In [91]:
np.cov(R, rowvar=False)

array([[ 1.00663697, -0.00401198,  0.01841455],
       [-0.00401198,  0.99468023,  0.00404738],
       [ 0.01841455,  0.00404738,  1.00467069]])

In [92]:
np.random.randint(0, 10, size=(3, 3))

array([[6, 0, 9],
       [6, 2, 5],
       [7, 0, 1]])

In [93]:
np.random.choice(10, size=(3, 3))

array([[9, 4, 5],
       [8, 2, 5],
       [9, 5, 1]])