## Introduction to Numpy

In [318]:
import sys 
import numpy as np

#### Basic Numpy Arrays

In [319]:
np.array([1,2,3,4])

array([1, 2, 3, 4])

In [320]:
a = np.array([1, 2, 3, 4])

In [321]:
a[0], a[1]


(1, 2)

In [322]:
a[0:]

array([1, 2, 3, 4])

In [323]:
a[1:3]

array([2, 3])

In [324]:
a[1:-1]

array([2, 3])

In [325]:
a[::2]


array([1, 3])

In [326]:
a

array([1, 2, 3, 4])

In [327]:
b = np.array([0, .5, 1, 1.5, 2])


In [328]:
b

array([0. , 0.5, 1. , 1.5, 2. ])

In [329]:
b[0], b[2], b[-1]

(0.0, 1.0, 2.0)

#### Array Types

In [330]:
a.dtype

dtype('int32')

In [331]:
b.dtype

dtype('float64')

In [332]:
np.array([1, 2, 3, 4], dtype=np.float)


array([1., 2., 3., 4.])

In [333]:
np.array([1, 2, 3, 4], dtype=np.int8)


array([1, 2, 3, 4], dtype=int8)

In [334]:
c = np.array(['a', 'b', 'c'])


In [335]:
c.dtype


dtype('<U1')

In [336]:
d = np.array([{'a': 1}, sys])


In [337]:
d.dtype


dtype('O')

#### Dimensions and shapes

In [338]:
A = np.array([
    [1, 2, 3],
    [4, 5, 6]
])

In [339]:
A.shape


(2, 3)

In [340]:
A.ndim

2

In [341]:
A.size

6

In [342]:
B = np.array([
    [
        [12, 11, 10],
        [9, 8, 7],
    ],
    [
        [6, 5, 4],
        [3, 2, 1]
    ]
])

In [343]:
B

array([[[12, 11, 10],
        [ 9,  8,  7]],

       [[ 6,  5,  4],
        [ 3,  2,  1]]])

In [344]:
B.shape

(2, 2, 3)

In [345]:
B.ndim


3

In [346]:
B.size


12

In [347]:
C = np.array([
    [
        [12, 11, 10],
        [9, 8, 7],
    ],
    [
        [6, 5, 4]
    ]
])

  C = np.array([


In [348]:
C.dtype

dtype('O')

In [349]:
C.shape


(2,)

In [350]:
C.size


2

In [351]:
type(C[0])


list

#### Indexing and Slicing of Matrices

In [352]:
# Square matrix
A = np.array([
#.   0. 1. 2
    [1, 2, 3], # 0
    [4, 5, 6], # 1
    [7, 8, 9]  # 2
])

In [353]:
A[1]

array([4, 5, 6])

In [354]:
A[1][0]

4

In [355]:
# A[d1, d2, d3, d4]


In [356]:
A[1, 0]


4

In [357]:
A[0:2]

array([[1, 2, 3],
       [4, 5, 6]])

In [358]:
A[:, :2]

array([[1, 2],
       [4, 5],
       [7, 8]])

In [359]:
A[:2, :2]

array([[1, 2],
       [4, 5]])

In [360]:
A[:2, 2:]

array([[3],
       [6]])

In [361]:
A

array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])

In [362]:
A[1] = np.array([10, 10, 10])

In [363]:
A

array([[ 1,  2,  3],
       [10, 10, 10],
       [ 7,  8,  9]])

In [364]:
A[2] = 99

In [365]:
A


array([[ 1,  2,  3],
       [10, 10, 10],
       [99, 99, 99]])

#### Summary Statistics


In [366]:
a = np.array([1, 2, 3, 4])

In [367]:
a.sum()

10

In [368]:
a.mean()

2.5

In [369]:
a.std()

1.118033988749895

In [370]:
a.var()

1.25

In [371]:
A.sum()

333

In [372]:
A.mean()

37.0

In [373]:
A.std()

43.96463225012679

In [374]:
A.sum(axis=0)

array([110, 111, 112])

In [375]:
A.sum(axis=1)

array([  6,  30, 297])

In [376]:
A.mean(axis=0)

array([36.66666667, 37.        , 37.33333333])

In [377]:
A.mean(axis=1)

array([ 2., 10., 99.])

In [378]:
A.std(axis=0)

array([44.22920101, 43.96210489, 43.69846171])

In [379]:
A.std(axis=1)

array([0.81649658, 0.        , 0.        ])

#### Broadcasting and Vectorized operations

In [380]:
a = np.arange(4)

In [381]:
a + 10

array([10, 11, 12, 13])

In [382]:
a * 10

array([ 0, 10, 20, 30])

In [383]:
a

array([0, 1, 2, 3])

In [384]:
a += 100

In [385]:
a

array([100, 101, 102, 103])

In [386]:
l = [0, 1, 2, 3]

In [387]:
[i * 10 for i in l]


[0, 10, 20, 30]

In [388]:
a = np.arange(4)


In [389]:
a


array([0, 1, 2, 3])

In [390]:
b = np.array([10, 10, 10, 10])


In [391]:
b


array([10, 10, 10, 10])

In [392]:
a + b

array([10, 11, 12, 13])

In [393]:
a * b

array([ 0, 10, 20, 30])

#### Boolean arrays

In [394]:
a = np.arange(4)


In [395]:
a

array([0, 1, 2, 3])

In [396]:
a[0], a[-1]


(0, 3)

In [397]:
a[[0, -1]]


array([0, 3])

In [398]:
a[[True, False, False, True]]


array([0, 3])

In [399]:
a


array([0, 1, 2, 3])

In [400]:
a >= 2


array([False, False,  True,  True])

In [401]:
a[a >= 2]


array([2, 3])

In [402]:
a.mean()


1.5

In [403]:
a[a > a.mean()]


array([2, 3])

In [404]:
a[~(a > a.mean())]


array([0, 1])

In [405]:
a[(a == 0) | (a == 1)]


array([0, 1])

In [406]:
a[(a <= 2) & (a % 2 == 0)]


array([0, 2])

In [407]:
A = np.random.randint(100, size=(3, 3))


In [408]:
A

array([[98, 42, 99],
       [90, 88, 42],
       [98, 32, 14]])

In [409]:
A[np.array([
    [True, False, True],
    [False, True, False],
    [True, False, True]
])]

array([98, 99, 88, 98, 14])

In [410]:
A > 30

array([[ True,  True,  True],
       [ True,  True,  True],
       [ True,  True, False]])

In [411]:
A[A > 30]


array([98, 42, 99, 90, 88, 42, 98, 32])

#### Linear Algebra

In [412]:
A = np.array([
    [1, 2, 3],
    [4, 5, 6],
    [7, 8, 9]
])

In [413]:
B = np.array([
    [6, 5],
    [4, 3],
    [2, 1]
])

In [414]:
A.dot(B)

array([[20, 14],
       [56, 41],
       [92, 68]])

In [415]:
A @ B

array([[20, 14],
       [56, 41],
       [92, 68]])

In [416]:
B.T

array([[6, 4, 2],
       [5, 3, 1]])

In [417]:
A

array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])

In [418]:
B.T @ A

array([[36, 48, 60],
       [24, 33, 42]])

#### Size of objects in Memory


#### Int, floats

In [419]:
# An integer in Python is > 24bytes
sys.getsizeof(1)

28

In [420]:
# Longs are even larger
sys.getsizeof(10**100)

72

In [421]:
# Numpy size is much smaller
np.dtype(int).itemsize

4

In [422]:
# Numpy size is much smaller
np.dtype(np.int8).itemsize

1

In [423]:
np.dtype(float).itemsize


8

#### Lists are even larger

In [424]:
# A one-element list
sys.getsizeof([1])

64

In [425]:
# An array of one element in numpy
np.array([1]).nbytes

4

#### And performance is also importan

In [426]:
l = list(range(100000))

In [427]:
a = np.arange(100000)

In [428]:
%time np.sum(a ** 2)


Wall time: 7.97 ms


216474736

In [429]:
%time sum([x ** 2 for x in l])


Wall time: 79.9 ms


333328333350000

#### Useful Numpy functions

#### random

In [430]:
np.random.random(size=2)


array([0.02480256, 0.3083126 ])

In [431]:
np.random.normal(size=2)


array([-0.11335684, -1.42553019])

In [432]:
np.random.rand(2, 4)


array([[0.50979541, 0.96786169, 0.85312753, 0.91044669],
       [0.59121849, 0.68486184, 0.6010195 , 0.49706204]])

#### arange

In [433]:
np.arange(10)

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])

In [434]:
np.arange(5, 10)

array([5, 6, 7, 8, 9])

In [435]:
np.arange(0, 1, .1)

array([0. , 0.1, 0.2, 0.3, 0.4, 0.5, 0.6, 0.7, 0.8, 0.9])

####  reshape

In [436]:
np.arange(10).reshape(2, 5)

array([[0, 1, 2, 3, 4],
       [5, 6, 7, 8, 9]])

In [437]:
np.arange(10).reshape(5, 2)

array([[0, 1],
       [2, 3],
       [4, 5],
       [6, 7],
       [8, 9]])

#### linspace

In [438]:
np.linspace(0, 1, 5)

array([0.  , 0.25, 0.5 , 0.75, 1.  ])

In [439]:
np.linspace(0, 1, 20)

array([0.        , 0.05263158, 0.10526316, 0.15789474, 0.21052632,
       0.26315789, 0.31578947, 0.36842105, 0.42105263, 0.47368421,
       0.52631579, 0.57894737, 0.63157895, 0.68421053, 0.73684211,
       0.78947368, 0.84210526, 0.89473684, 0.94736842, 1.        ])

In [440]:
np.linspace(0, 1, 20, False)


array([0.  , 0.05, 0.1 , 0.15, 0.2 , 0.25, 0.3 , 0.35, 0.4 , 0.45, 0.5 ,
       0.55, 0.6 , 0.65, 0.7 , 0.75, 0.8 , 0.85, 0.9 , 0.95])

####  zeros, ones, empty

In [441]:
np.zeros(5)

array([0., 0., 0., 0., 0.])

In [442]:
np.zeros((3, 3))

array([[0., 0., 0.],
       [0., 0., 0.],
       [0., 0., 0.]])

In [443]:
np.zeros((3, 3), dtype=np.int)

array([[0, 0, 0],
       [0, 0, 0],
       [0, 0, 0]])

In [444]:
np.ones(5)

array([1., 1., 1., 1., 1.])

In [445]:
np.ones((3, 3))

array([[1., 1., 1.],
       [1., 1., 1.],
       [1., 1., 1.]])

In [446]:
np.empty(5)

array([1., 1., 1., 1., 1.])

In [447]:
np.empty((2, 2))

array([[0.25, 0.5 ],
       [0.75, 1.  ]])

#### identity and eye

In [448]:
np.identity(3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

In [449]:
np.eye(3, 3)

array([[1., 0., 0.],
       [0., 1., 0.],
       [0., 0., 1.]])

In [450]:
np.eye(8, 4)

array([[1., 0., 0., 0.],
       [0., 1., 0., 0.],
       [0., 0., 1., 0.],
       [0., 0., 0., 1.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.]])

In [451]:
np.eye(8, 4, k=1)

array([[0., 1., 0., 0.],
       [0., 0., 1., 0.],
       [0., 0., 0., 1.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.]])

In [452]:
np.eye(8, 4, k=-3)

array([[0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [0., 0., 0., 0.],
       [1., 0., 0., 0.],
       [0., 1., 0., 0.],
       [0., 0., 1., 0.],
       [0., 0., 0., 1.],
       [0., 0., 0., 0.]])

In [453]:
"Hello World"[6]

'W'