In [1]:
import numpy as np

In [6]:
# A NumPy array can be built directly from an ordinary Python list.
values = [1, 2, 3]
a = np.array(values)      # rank 1 array holding the three list items
print(type(a))            # Prints "<class 'numpy.ndarray'>"
a                         # bare last expression so the notebook echoes the array

<class 'numpy.ndarray'>


array([1, 2, 3])

In [7]:
print(a.shape)            # Prints "(3,)": a single axis of length 3

(3,)


In [7]:
# Individual elements are read with square brackets and a zero-based index
print(a[0], a[1], a[2])   # Prints "1 2 3"

1 2 3


In [8]:
a[0] = 5                  # Arrays are mutable: overwrite the first element in place
print(a)                  # Prints "[5 2 3]" (printed arrays have no commas)

[5 2 3]


In [15]:
# Rank 2 array built from a nested list: 2 rows by 3 columns.
b = np.array([
    [1, 2, 3],
    [4, 5, 6],
])
print(b.shape)                        # Prints "(2, 3)"
print(b[0, 0], b[0, 1], b[1, 0])      # Prints "1 2 4"

# For contrast: a plain nested list and the array converted from it.
w = [[1, 2], [2, 3]]
w1 = np.array(w)
print(w[0][1])                        # Prints "2"; lists chain one bracket per level
print(type(w), type(b))               # list versus numpy.ndarray
print(b.transpose())                  # Same result as b.T: the (3, 2) transpose
print(type(w1))                       # The converted list is an ndarray as well

(2, 3)
1 2 4
2
<class 'list'> <class 'numpy.ndarray'>
[[1 4]
 [2 5]
 [3 6]]
<class 'numpy.ndarray'>


In [10]:
# Numpy also provides many functions to create arrays
a = np.zeros((2,2))   # Create a 2x2 array of all zeros (floating point); rebinds `a`
print(a)              # Prints "[[0. 0.]
                      #          [0. 0.]]"

[[0. 0.]
 [0. 0.]]


In [11]:
b = np.ones((1,2))    # Create a 1x2 array of all ones (floating point); rebinds `b`
print(b)              # Prints "[[1. 1.]]"

[[1. 1.]]


In [12]:
c = np.full((2,2), 7)  # Create a constant array; the integer fill value gives an integer array
print(c)               # Prints "[[7 7]
                       #          [7 7]]"

[[7 7]
 [7 7]]


In [24]:
# Values are drawn from the continuous uniform distribution over [0.0, 1.0).
# No seed is set, so the numbers differ on every run.
e = np.random.random((2,2))  # Create a 2x2 array filled with random values
print(e)                     # Might print "[[0.91940167 0.08143941]
                             #               [0.68744134 0.87236687]]"


[[0.05150152 0.38372521]
 [0.72543606 0.64075992]]


In [20]:
# Slicing: like Python lists, numpy arrays can be sliced. Because an array may
# have several dimensions, one slice is given per dimension.

# Build the rank 2 array of shape (3, 4) that holds 1..12 row by row:
# [[ 1  2  3  4]
#  [ 5  6  7  8]
#  [ 9 10 11 12]]
a = np.array([list(range(first, first + 4)) for first in (1, 5, 9)])
print(a)

# Take rows 0-1 and columns 1-2. Every slice is half-open, [start, stop),
# so b is the (2, 2) array:
# [[2 3]
#  [6 7]]
b = a[0:2, 1:3]
print(b)

[[ 1  2  3  4]
 [ 5  6  7  8]
 [ 9 10 11 12]]
[[2 3]
 [6 7]]


In [13]:
# A slice of an array is a view into the same data, so modifying it
# will modify the original array.
# NOTE: this cell needs `a` and `b` exactly as the slicing cell left them
# (b = a[:2, 1:3]); the np.zeros / np.ones cells rebind both names, so run the
# slicing cell immediately before this one.
print(a[0, 1])   # Prints "2"
b[0, 0] = 77     # b[0, 0] is the same piece of data as a[0, 1]
print(a[0, 1])   # Prints "77"

2
77


In [27]:
# Indexing a column with a single integer drops that axis, so the result is a
# rank 1 array; indexing the result with None adds an axis of length 1 back.
col_r1 = a[:, 1]                 # Column 1 of a, as a rank 1 array
print(col_r1, col_r1.shape)      # Prints "[ 2  6 10] (3,)" while a[0, 1] is still 2
col_r1[:, None].shape            # (3, 1): the same values laid out as a column

[ 2  6 10] (3,)


(3, 1)

In [32]:
a = np.array([[1,2], [3, 4], [5, 6]])
print(a)

# Boolean mask indexing: a > 2 is an array of booleans with the shape of a,
# and indexing with it keeps only the elements where the mask is True.
print(a[a > 2])     # Prints "[3 4 5 6]"

# With only a condition, np.where returns one index array per axis
# (row indices, then column indices) of the matching elements.
print(np.where(a>2))

# Plain Python equivalent -> much slower on large inputs, because every element
# is visited by an interpreted double loop.
# The nested list gets its own name so that `a` stays an ndarray: rebinding `a`
# to a list would make array-only expressions such as a[a > 2] fail if a cell
# is re-run afterwards.
a_list = a.tolist()
for row in a_list:
    for item in row:
        if item > 2:
            print(item)

[[1 2]
 [3 4]
 [5 6]]
[3 4 5 6]
(array([1, 1, 2, 2], dtype=int64), array([0, 1, 0, 1], dtype=int64))
3
4
5
6


In [33]:
# Array math
# The basic arithmetic operations act element by element, and each of them is
# offered both as an overloaded operator and as a function in the numpy module.

x = np.array([[1.0, 2.0], [3.0, 4.0]])   # float literals give a float64 array
y = np.array([[5.0, 6.0], [7.0, 8.0]])

# Sum, element by element. Operator and function give the same array:
# [[ 6.0  8.0]
#  [10.0 12.0]]
print(x + y)
print(np.add(x, y))

# Difference, element by element. Operator and function give the same array:
# [[-4.0 -4.0]
#  [-4.0 -4.0]]
print(x - y)
print(np.subtract(x, y))

# Product, element by element (not a matrix product). Both give:
# [[ 5.0 12.0]
#  [21.0 32.0]]
print(x * y)
print(np.multiply(x, y))

# Quotient, element by element. Both give:
# [[ 0.2         0.33333333]
#  [ 0.42857143  0.5       ]]
print(x / y)
print(np.divide(x, y))

# Square root of every element of x:
# [[ 1.          1.41421356]
#  [ 1.73205081  2.        ]]
print(np.sqrt(x))

[[ 6.  8.]
 [10. 12.]]
[[ 6.  8.]
 [10. 12.]]
[[-4. -4.]
 [-4. -4.]]
[[-4. -4.]
 [-4. -4.]]
[[ 5. 12.]
 [21. 32.]]
[[ 5. 12.]
 [21. 32.]]
[[0.2        0.33333333]
 [0.42857143 0.5       ]]
[[0.2        0.33333333]
 [0.42857143 0.5       ]]
[[1.         1.41421356]
 [1.73205081 2.        ]]


In [21]:
# Note that * is elementwise multiplication, not matrix multiplication.
# We instead use the dot function to compute inner products of vectors,
# to multiply a vector by a matrix, and to multiply matrices. dot is available
# both as an array method and as a function in the numpy module.

x = np.array([[1,2],[3,4]])
y = np.array([[5,6],[7,8]])

v = np.array([9,10])
w = np.array([11, 12])

# Inner product of vectors; both produce 219 (9*11 + 10*12)
print(v.dot(w))
print(np.dot(v, w))

# Matrix / vector product; both produce the rank 1 array [29 67]
print(x.dot(v))
print(np.dot(x, v))

# Matrix / matrix product; both produce the rank 2 array
# [[19 22]
#  [43 50]]
print(x.dot(y))
print(np.dot(x, y))

219
219
[29 67]
[29 67]
[[19 22]
 [43 50]]
[[19 22]
 [43 50]]


In [34]:
# Numpy provides many useful functions for performing computations on arrays;
# two of the most useful are sum and mean. The axis argument names the
# dimension that is collapsed: axis=0 reduces down each column, axis=1 across
# each row.

x = np.array([[1,2],[3,4]])

print(np.sum(x))  # Compute sum of all elements; prints "10"
print(np.mean(x, axis=0))  # Compute mean of each column; prints "[2. 3.]"
print(np.mean(x, axis=1))  # Compute mean of each row; prints "[1.5 3.5]"

10
[2. 3.]
[1.5 3.5]


In [23]:
# Transpose of a matrix: .T swaps the rows and columns of a rank 2 array

x = np.array([[1,2], [3,4]])
print(x)    # Prints "[[1 2]
            #          [3 4]]"
print(x.T)  # Prints "[[1 3]
            #          [2 4]]"

# Note that taking the transpose of a rank 1 array does nothing: with a single
# axis there is no notion of a row vector versus a column vector. To get one,
# add a second axis first (for example, v[:, None] has shape (3, 1)).
v = np.array([1,2,3])
print(v)    # Prints "[1 2 3]"
print(v.T)  # Prints "[1 2 3]"

[[1 2]
 [3 4]]
[[1 3]
 [2 4]]
[1 2 3]
[1 2 3]


In [35]:
from datetime import datetime, timedelta  # `datetime` is no longer used in this cell; it stays imported for any cell that relies on it
from time import perf_counter

# Numpy arrays are fast. Very fast.
# Let's create a random numpy matrix of values between 0 and 1
mat_num = np.random.random((2000, 2000))
mat_pyt = mat_num.tolist()   # the same values as nested Python lists

# We will sum all numbers greater than 0.95, once with numpy and once with
# plain Python lists, and time both.
# Intervals are measured with perf_counter, a monotonic high-resolution clock
# intended for timing; datetime.now() follows the wall clock, which can be
# adjusted while the cell is running. Only the computation is timed, not the
# printing, and timedelta keeps the familiar H:MM:SS.ffffff display.

# Let's time our numpy method first
start_time = perf_counter()
numpy_sum = np.sum(mat_num[mat_num > 0.95])
numpy_elapsed = perf_counter() - start_time
print(numpy_sum)
print(timedelta(seconds=numpy_elapsed))

# Let's time our python list method now
start_time = perf_counter()
total_sum = 0
for row in mat_pyt:
    for value in row:
        if value > 0.95:
            total_sum += value
python_elapsed = perf_counter() - start_time
# The two sums can differ in the last few digits because the additions are
# carried out in a different order.
print(total_sum)
print(timedelta(seconds=python_elapsed))

195095.5606316168
0:00:00.010959
195095.56063161968
0:00:00.221380
