In [1]:
import numpy as np

# NumPy Arrays

In [2]:
# NumPy arrays come in two flavors: vectors and matrices
# Vectors are one-dimensional arrays and matrices are two-dimensional (arrays can also have more than two dimensions)

In [3]:
# Creating a NumPy array from a plain Python list
my_list = [1,2,3]
x = np.array(my_list)

In [4]:
# np.array returns an ndarray, NumPy's n-dimensional array type
type(x)

numpy.ndarray

In [5]:
# A nested list (a list of equal-length rows) describes a 2-D array
my_matrix= [[1,2,4], [4,5,6], [7,8,9]]

In [6]:
# Converting the nested list gives a 3x3 two-dimensional array
np.array(my_matrix)

array([[1, 2, 4],
       [4, 5, 6],
       [7, 8, 9]])

In [7]:
# Built-in functions for creating arrays
# First, plain Python for comparison: range(0, 5) yields 0..4 (the stop value is excluded)
list(range(0,5))

[0, 1, 2, 3, 4]

In [8]:
# np.arange produces the same sequence of values as range(0, 5) above,
# but returns them as a NumPy array instead of a Python list
np.arange(0,5)

array([0, 1, 2, 3, 4])

In [9]:
# Like range, arange takes start, stop (exclusive) and step arguments
np.arange(1,11,2)

array([1, 3, 5, 7, 9])

In [10]:
# zeros() builds an array filled with 0s; a single integer gives a 1-D array of that length
# (the values are floats, as the trailing dots in the output show)
np.zeros(3)

array([ 0.,  0.,  0.])

In [11]:
# For more dimensions, pass the shape as a single tuple: (rows, columns)
np.zeros((3,4))

array([[ 0.,  0.,  0.,  0.],
       [ 0.,  0.,  0.,  0.],
       [ 0.,  0.,  0.,  0.]])

In [12]:
# ones() works the same way, filling the (rows, columns) shape with 1s
np.ones((3,6))

array([[ 1.,  1.,  1.,  1.,  1.,  1.],
       [ 1.,  1.,  1.,  1.,  1.,  1.],
       [ 1.,  1.,  1.,  1.,  1.,  1.]])

In [13]:
# linspace returns evenly spaced numbers from the start value to the stop value, both included
# The third argument is the total number of values returned (endpoints included), not a step size
np.linspace(0,10,3)

array([  0.,   5.,  10.])

In [14]:
# eye(n) builds an n x n identity matrix: a square matrix
# with 1s on the main diagonal and 0s everywhere else
np.eye(3)

array([[ 1.,  0.,  0.],
       [ 0.,  1.,  0.],
       [ 0.,  0.,  1.]])

In [15]:
# Creating random NumPy values - rand() samples from a uniform distribution over [0, 1)
# With no arguments it returns a single float; no seed is set in the cells shown, so the value differs between runs
np.random.rand()

0.6926531560050913

In [16]:
# Passing dimensions returns an array of uniform samples with that shape (here 2 rows x 3 columns)
# Note: unlike zeros()/ones(), the dimensions are separate arguments rather than a tuple
np.random.rand(2,3)

array([[ 0.77588239,  0.28614475,  0.54617213],
       [ 0.8872554 ,  0.07211624,  0.66712148]])

In [17]:
# randn samples from the standard normal (Gaussian) distribution: mean 0, standard deviation 1
# Here it returns 5 such samples
np.random.randn(5)

array([-0.78139227,  1.12520475,  0.21114218,  0.94504901,  0.01042469])

In [18]:
# With two dimensions, randn returns a 5x4 array of standard normal samples
np.random.randn(5,4)

array([[ 0.64502775,  0.14959162, -0.35637063,  0.69698056],
       [ 0.66089056, -1.94098731, -1.59198734, -0.48293544],
       [-0.48866307, -0.14594121, -0.85350529, -1.7273126 ],
       [ 1.08929611, -1.34305636, -0.10615739,  0.79185467],
       [ 0.09873401,  0.17428438,  0.65747682, -0.66935453]])

In [19]:
# Random integers: randint(low, high, size) draws `size` integers from low (inclusive) up to high (exclusive)
np.random.randint(1,100, 3)

array([62, 36, 17])

In [20]:
# Two arrays used by the following cells: the integers 0..24,
# and 10 random integers drawn from 0 (inclusive) up to 50 (exclusive)
arr = np.arange(25)
ranarr = np.random.randint(0,50,10)

In [21]:
# Reshape method
# Start from the flat, 25-element array
arr

array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14, 15, 16,
       17, 18, 19, 20, 21, 22, 23, 24])

In [22]:
# The new dimensions must multiply to the number of elements in arr (5 * 5 == 25), otherwise reshape raises an error
# reshape returns a new array object; arr itself keeps its original shape
arr.reshape(5,5)

array([[ 0,  1,  2,  3,  4],
       [ 5,  6,  7,  8,  9],
       [10, 11, 12, 13, 14],
       [15, 16, 17, 18, 19],
       [20, 21, 22, 23, 24]])

In [23]:
# shape is an attribute (no parentheses) giving the size of each dimension; arr is still 1-D with 25 elements
arr.shape

(25,)

In [24]:
# The reshaped result reports 5 rows and 5 columns
arr.reshape(5,5).shape

(5, 5)

In [25]:
# Show the random integers generated earlier
ranarr

array([24, 33, 48, 20, 30,  4,  1, 38, 28, 13])

In [26]:
# argmin returns the index position of the smallest value (not the value itself)
ranarr.argmin()

6

In [27]:
# argmax returns the index position of the largest value
ranarr.argmax()

2

# NumPy Operations

In [28]:
# Rebind arr to the integers 0..9 for the arithmetic examples below
arr = np.arange(0,10)
arr

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])

In [29]:
# Arithmetic between arrays is element-wise: values at the same index position are combined
arr + arr

array([ 0,  2,  4,  6,  8, 10, 12, 14, 16, 18])

In [30]:
# Element-wise multiplication (each value times itself), not a matrix product
arr * arr

array([ 0,  1,  4,  9, 16, 25, 36, 49, 64, 81])

In [31]:
# Element-wise subtraction
arr - arr

array([0, 0, 0, 0, 0, 0, 0, 0, 0, 0])

In [32]:
# arr / arr - element 0 would be 0/0; NumPy emits a RuntimeWarning and puts nan in that position instead of raising an error

In [33]:
# A scalar operand is applied to every element: cube each value
arr ** 3

array([  0,   1,   8,  27,  64, 125, 216, 343, 512, 729])

In [34]:
# Add 100 to every element
arr + 100

array([100, 101, 102, 103, 104, 105, 106, 107, 108, 109])

In [35]:
# NumPy's math functions work element-wise: square root of every element
np.sqrt(arr)

array([ 0.        ,  1.        ,  1.41421356,  1.73205081,  2.        ,
        2.23606798,  2.44948974,  2.64575131,  2.82842712,  3.        ])

In [36]:
# exp computes e raised to the power of each element
np.exp(arr)

array([  1.00000000e+00,   2.71828183e+00,   7.38905610e+00,
         2.00855369e+01,   5.45981500e+01,   1.48413159e+02,
         4.03428793e+02,   1.09663316e+03,   2.98095799e+03,
         8.10308393e+03])

In [37]:
# Largest value in the array, using the module-level function
np.max(arr)

9

In [38]:
# Same result using the array's own method
arr.max()

9

In [39]:
# Element-wise sine; the elements are interpreted as radians
np.sin(arr)

array([ 0.        ,  0.84147098,  0.90929743,  0.14112001, -0.7568025 ,
       -0.95892427, -0.2794155 ,  0.6569866 ,  0.98935825,  0.41211849])

# NumPy Indexing and Selection

In [42]:
# Integers 0..10 for the indexing examples
arr = np.arange(0,11)
arr

array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10])

In [44]:
# Single element by (zero-based) index
arr[4]

4

In [45]:
# Slice notation [start:stop] - from start up to, but not including, stop
arr[1:4]

array([1, 2, 3])

In [46]:
# Omitting start slices from the beginning: the first 5 elements
arr[:5]

array([0, 1, 2, 3, 4])

In [47]:
# Omitting stop slices through the end: everything from index 3 onward
arr[3:]

array([ 3,  4,  5,  6,  7,  8,  9, 10])

In [49]:
# Broadcasting: assigning a single value to a slice sets every element of that slice to the value
# This modifies arr in place
arr[0:5] = 100
arr

array([100, 100, 100, 100, 100,   5,   6,   7,   8,   9,  10])

In [55]:
# Reset arr to 0..10 after the in-place change above
arr = np.arange(0,11)

In [56]:
# Slicing an array does not copy the data: the slice refers to the same elements as the original array,
# so changes made through the slice also change the original
slice_of_arr = arr[0:6]
slice_of_arr

array([0, 1, 2, 3, 4, 5])

In [57]:
# Overwrite every element of the slice
slice_of_arr[:] = 99
slice_of_arr

array([99, 99, 99, 99, 99, 99])

In [58]:
# The original array changed too: its first six elements are now 99
arr

array([99, 99, 99, 99, 99, 99,  6,  7,  8,  9, 10])

In [59]:
# copy() creates an independent copy of the array - changing the copy won't mutate the original
arr_copy = arr.copy()
arr_copy

array([99, 99, 99, 99, 99, 99,  6,  7,  8,  9, 10])

In [61]:
# Overwrite every element of the copy
arr_copy[:] = 200
arr_copy

array([200, 200, 200, 200, 200, 200, 200, 200, 200, 200, 200])

In [62]:
# arr is unaffected by the change made to arr_copy
arr

array([99, 99, 99, 99, 99, 99,  6,  7,  8,  9, 10])

In [65]:
# Let's now take a look at indexing 2-D arrays (matrices)
# Two notations reach a single element:
# mat[row,col]
# mat[row][col]
mat = np.array([[5,10,15],[20,25,30],[35,40,45]])
mat

array([[ 5, 10, 15],
       [20, 25, 30],
       [35, 40, 45]])

In [66]:
# Indexing with a single integer returns an entire row (here the first one)
mat[0]

array([ 5, 10, 15])

In [67]:
# Second row
mat[1]

array([20, 25, 30])

In [68]:
# Grab an individual value - 2 ways
# Way 1: chained brackets - select row 1, then element 1 of that row
mat[1][1]

25

In [70]:
# Way 2: a single bracket with row,col - this is the more common way
mat[1,1]

25

In [71]:
# Row 0, column 2
mat[0,2]

15

In [74]:
# 2-D array slicing
# Take the rows from the start up to (but not including) index 2,
# and for each of those rows the columns from index 1 to the end
mat[:2,1:]

array([[10, 15],
       [25, 30]])

In [76]:
# Rows from index 1 to the end, columns up to (but not including) index 2
mat[1:,:2]

array([[20, 25],
       [35, 40]])

In [78]:
# Conditional Selection
# Integers 1..10 for the examples below
arr = np.arange(1,11)
arr

array([ 1,  2,  3,  4,  5,  6,  7,  8,  9, 10])

In [79]:
# Comparing an array with a scalar tests every element and returns a boolean array
# (True where the element is greater than 4); it does not select the elements yet
arr > 4

array([False, False, False, False,  True,  True,  True,  True,  True,  True], dtype=bool)

In [80]:
# Keep the boolean mask in a variable
bool_arr = arr >4

In [81]:
# Indexing with the mask keeps only the elements where the mask is True
arr[bool_arr]

array([ 5,  6,  7,  8,  9, 10])

In [83]:
# Most common format for conditional selection: write the condition directly inside the brackets
arr[arr>4]

array([ 5,  6,  7,  8,  9, 10])