## Arrays vs Lists

In [1]:
from time import perf_counter

import numpy as np

In [2]:
L = [1, 2, 3]

In [3]:
A = np.array([1, 2, 3])

In [4]:
for e in L:
    print(e)

1
2
3


In [5]:
for e in A:
    print(e)

1
2
3


In [6]:
L.append(4)

In [7]:
L

[1, 2, 3, 4]

In [8]:
A.append(A)   # doesn't work: ndarray has no append method

AttributeError: 'numpy.ndarray' object has no attribute 'append'

In [9]:
L + [5]

[1, 2, 3, 4, 5]

In [10]:
A + np.array([5])

array([6, 7, 8])

In [11]:
A + np.array([4, 5, 6])

array([5, 7, 9])

In [12]:
A + np.array([4, 5])  # doesn't work: shapes (3,) and (2,) cannot be broadcast together

ValueError: operands could not be broadcast together with shapes (3,) (2,) 

In [13]:
2 * A

array([2, 4, 6])

In [14]:
2 * L

[1, 2, 3, 4, 1, 2, 3, 4]

In [15]:
L + L

[1, 2, 3, 4, 1, 2, 3, 4]

In [16]:
# Lists have no element-wise arithmetic, so adding 3 to every item needs an explicit loop.
L2 = []
for e in L:
    L2.append(e + 3)

In [17]:
L2

[4, 5, 6, 7]

In [18]:
L2 = [e + 3 for e in L]

In [19]:
L2

[4, 5, 6, 7]

In [20]:
L + 3   # doesn't work: a list can only be concatenated with another list

TypeError: can only concatenate list (not "int") to list

In [21]:
A + 3

array([4, 5, 6])

In [22]:
# Square every element of the list one at a time (for an array the same operation is A ** 2).
L2 = []
for e in L:
    L2.append(e**2)

In [23]:
L2

[1, 4, 9, 16]

In [24]:
A ** 2

array([1, 4, 9])

In [25]:
np.sqrt(A)

array([1.        , 1.41421356, 1.73205081])

In [26]:
np.log(A)

array([0.        , 0.69314718, 1.09861229])

In [27]:
np.exp(A)

array([ 2.71828183,  7.3890561 , 20.08553692])

In [28]:
np.tanh(A)

array([0.76159416, 0.96402758, 0.99505475])

## The Dot Product

$$ a \cdot b = a^T b = \sum_{d=1}^D a_d b_d $$

In [29]:
a = np.array([1, 2])
b = np.array([3, 4])

In [30]:
# Dot product by hand: pair up the elements with zip and accumulate the products.
dot = 0
for e, f in zip(a, b):
    dot += e * f
dot

11

In [31]:
# Dot product by hand again, this time indexing both arrays by position.
dot = 0
for i in range(len(a)):
    dot += a[i] * b[i]
dot

11

In [32]:
a * b

array([3, 8])

In [33]:
np.sum(a * b)

11

In [34]:
(a * b).sum()

11

In [35]:
np.dot(a, b)

11

In [36]:
a.dot(b)

11

In [37]:
a @ b

11

$$ a^T b = \left\lVert a \right\rVert \left\lVert b \right\rVert \cos \theta_{ab}$$

$$ \cos \theta_{ab} = \frac{a^T b}{\left\lVert a \right\rVert \left\lVert b \right\rVert} $$

$$ \text{where } \left\lVert x \right\rVert = \sqrt{\sum_{d=1}^D x_d^2} $$

In [38]:
# Magnitude of a from the definition: square root of the sum of squared elements.
amag = np.sqrt((a * a).sum())

In [39]:
amag

2.23606797749979

In [40]:
np.linalg.norm(a)

2.23606797749979

In [41]:
# Cosine of the angle between a and b: dot product divided by the product of the norms.
cosangle = a.dot(b) / (np.linalg.norm(a) * np.linalg.norm(b))

In [42]:
cosangle

0.9838699100999074

In [43]:
angle = np.arccos(cosangle)

In [44]:
angle

0.17985349979247847

## Speed Test

In [45]:
## speed comparison ##
from datetime import datetime

# note: you can also use %timeit

# Two random length-100 vectors; T is the number of times each implementation is called.
a = np.random.randn(100)
b = np.random.randn(100)
T = 100_000

def slow_dot_product(a, b):
    """Return the dot product of ``a`` and ``b`` computed in pure Python.

    Elements are paired up with ``zip`` (so iteration stops at the end of
    the shorter input) and the pairwise products are added up left to
    right, starting from the integer 0.
    """
    return sum(x * y for x, y in zip(a, b))

# Time T calls of each implementation with perf_counter, a monotonic
# high-resolution clock intended for measuring short durations
# (datetime.now() is a wall clock and can jump if the system time changes).
t0 = perf_counter()
for t in range(T):
    slow_dot_product(a, b)
dt1 = perf_counter() - t0  # seconds spent in the pure-Python loop version

t0 = perf_counter()
for t in range(T):
    a.dot(b)
dt2 = perf_counter() - t0  # seconds spent in NumPy's dot

# A ratio above 1 means the Python loop is slower than NumPy by that factor.
print(f"dt1/dt2: {dt1 / dt2}!")

dt1/dt2: 30.772455886826894!


## Matrices

In [46]:
L = [[1, 2], [3, 4]]
L

[[1, 2], [3, 4]]

In [47]:
L[0]

[1, 2]

In [48]:
L[0][1]

2

In [49]:
A = np.array([[1, 2], [3, 4]])
A

array([[1, 2],
       [3, 4]])

In [50]:
A[0][1]

2

In [51]:
A[0,1]

2

In [52]:
A[:,0]

array([1, 3])

In [53]:
A.T

array([[1, 3],
       [2, 4]])

In [54]:
np.exp(A)

array([[ 2.71828183,  7.3890561 ],
       [20.08553692, 54.59815003]])

In [55]:
np.exp(L)

array([[ 2.71828183,  7.3890561 ],
       [20.08553692, 54.59815003]])

In [56]:
B = np.array([[1, 2, 3], [4, 5, 6]])
B

array([[1, 2, 3],
       [4, 5, 6]])

In [57]:
A.dot(B)

array([[ 9, 12, 15],
       [19, 26, 33]])

In [58]:
# doesn't work: A is (2,2) but B.T is (3,2), so the inner dimensions do not match
A.dot(B.T)

ValueError: shapes (2,2) and (3,2) not aligned: 2 (dim 1) != 3 (dim 0)

In [59]:
np.linalg.det(A)

-2.0000000000000004

In [60]:
np.linalg.inv(A)

array([[-2. ,  1. ],
       [ 1.5, -0.5]])

In [61]:
# note: * multiplies element by element, so this is NOT the matrix product and does not give the identity
np.linalg.inv(A) * A

array([[-2. ,  2. ],
       [ 4.5, -2. ]])

In [62]:
np.linalg.inv(A).dot(A)

array([[1.0000000e+00, 4.4408921e-16],
       [0.0000000e+00, 1.0000000e+00]])

In [63]:
np.trace(A)

5

In [64]:
np.diag(A)

array([1, 4])

In [65]:
np.diag(np.diag(A))

array([[1, 0],
       [0, 4]])

In [66]:
np.linalg.eig(A)

(array([-0.37228132,  5.37228132]),
 array([[-0.82456484, -0.41597356],
        [ 0.56576746, -0.90937671]]))

In [67]:
Lam, V = np.linalg.eig(A)
Lam, V

(array([-0.37228132,  5.37228132]),
 array([[-0.82456484, -0.41597356],
        [ 0.56576746, -0.90937671]]))

In [68]:
# Exact == between floats can fail because of round-off, even when the values print the same; compare with np.allclose instead.
V[:,0] * Lam[0] == A @ V[:,0]

array([ True, False])

In [69]:
V[:,0] * Lam[0], A @ V[:,0]

(array([ 0.30697009, -0.21062466]), array([ 0.30697009, -0.21062466]))

In [70]:
np.allclose(V[:,0] * Lam[0], A @ V[:,0])

True

In [71]:
np.allclose(V @ np.diag(Lam), A @ V)

True

## Solving Linear Systems

In [72]:
A = [[1, 1], [1.5, 4.0]]
b = [2200, 5050]

In [73]:
np.linalg.inv(A).dot(b)

array([1500.,  700.])

In [74]:
# Solves Ax = b directly, without calling np.linalg.inv; this is the usual way to solve a linear system.
np.linalg.solve(A, b)

array([1500.,  700.])

## Generating Data

In [75]:
np.zeros((2, 3))

array([[0., 0., 0.],
       [0., 0., 0.]])

In [76]:
np.ones((2, 3))

array([[1., 1., 1.],
       [1., 1., 1.]])

In [77]:
10 * np.ones((2, 3))

array([[10., 10., 10.],
       [10., 10., 10.]])

In [78]:
np.eye(3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

In [79]:
np.random.random()

0.9298645382399021

In [80]:
np.random.random((2, 3))

array([[0.48258795, 0.29816875, 0.60581982],
       [0.78741088, 0.52126447, 0.42287517]])

In [81]:
np.random.randn(2, 3)

array([[ 1.24329936,  0.99844327, -0.13458837],
       [-0.71582097, -0.10628099, -1.33702845]])

In [82]:
R = np.random.randn(10_000)

In [83]:
np.mean(R)

0.006092666679035349

In [84]:
R.mean()

0.006092666679035349

In [85]:
R.var()

1.0075475378435796

In [86]:
R.std()

1.0037666750015064

In [87]:
np.sqrt(R.var())

1.0037666750015064

In [88]:
R = np.random.randn(10_000, 3)

In [89]:
R.mean(axis=0)

array([-0.00312394, -0.0077288 , -0.01263443])

In [90]:
R.mean(axis=1)

array([-0.14887068,  0.99430345, -1.50873024, ..., -0.61270488,
        0.01760109,  0.31942229])

In [91]:
R.mean(axis=1).shape

(10000,)

In [92]:
# np.cov treats each ROW as a variable by default, so the 10000 x 3 sample matrix yields a 10000 x 10000 result
np.cov(R).shape

(10000, 10000)

In [93]:
np.cov(R.T)

array([[ 0.99505219,  0.00706365, -0.0101146 ],
       [ 0.00706365,  1.0059272 , -0.01761487],
       [-0.0101146 , -0.01761487,  1.02602177]])

In [94]:
np.cov(R, rowvar=False)

array([[ 0.99505219,  0.00706365, -0.0101146 ],
       [ 0.00706365,  1.0059272 , -0.01761487],
       [-0.0101146 , -0.01761487,  1.02602177]])

In [95]:
np.random.randint(0, 10, size=(3, 3))

array([[9, 5, 9],
       [2, 6, 8],
       [6, 1, 6]])

## Exercise

In [96]:
## speed comparison ##
from datetime import datetime

# note: you can also use %timeit

# Two random 100x100 matrices; T is the number of times each implementation is called.
a = np.random.randn(100, 100)
b = np.random.randn(100, 100)
T = 200

def slow_matrix_product(a, b):
    """Multiply two 2-D arrays one output entry at a time.

    Parameters
    ----------
    a : np.ndarray, shape (n, k)
        Left operand.
    b : np.ndarray, shape (k, m)
        Right operand.

    Returns
    -------
    np.ndarray, shape (n, m)
        ``results[i, j]`` is the dot product of row ``i`` of ``a`` with
        column ``j`` of ``b``. The dtype is float64 for integer and real
        inputs and is widened to a complex dtype when either input is complex.

    Raises
    ------
    ValueError
        Raised by the ``@`` operator when a row of ``a`` and a column of
        ``b`` have different lengths.
    """
    n_rows, n_cols = a.shape[0], b.shape[1]
    # Keep at least float64 (the previous output dtype) but widen for complex
    # inputs, so imaginary parts are not dropped when entries are stored.
    out_dtype = np.result_type(a.dtype, b.dtype, np.float64)
    results = np.zeros((n_rows, n_cols), dtype=out_dtype)
    for i in range(n_rows):
        for j in range(n_cols):
            results[i, j] = a[i, :] @ b[:, j]
    return results

# Time T calls of each implementation with perf_counter, a monotonic
# high-resolution clock intended for measuring short durations
# (datetime.now() is a wall clock and can jump if the system time changes).
t0 = perf_counter()
for t in range(T):
    slow_matrix_product(a, b)
dt1 = perf_counter() - t0  # seconds spent in the entry-by-entry version

t0 = perf_counter()
for t in range(T):
    a @ b
dt2 = perf_counter() - t0  # seconds spent in NumPy's matrix product

# A ratio above 1 means the Python loops are slower than NumPy by that factor.
print(f"dt1/dt2: {dt1 / dt2}!")

dt1/dt2: 359.9025661587811!
