In [1]:
import numpy as np

*Lists are slower because each element is a full Python object that stores four pieces of information.

    1. Size ( 4 bytes for integers )
    2. Reference Count  ( 8 bytes for integers )
    3. Object type  ( 8 bytes for integers )
    4. Object value ( 8 bytes for integers )
    
*Lists are not contiguous in memory
    1. A list holds pointers to each element's memory location.
    2. Partial loading of memory blocks.
    
*Type checking is required for each element.


*NumPy stores only the object value, and its type can be changed to int64, int32, int16 or int8

*No type checking in NumPy

*NumPy uses contiguous memory

    1. Uses Single Instruction Multiple Data ( SIMD Vector Processing )
    2. Effective Cache Utilization.
    
 

## The Basics

In [3]:
# Element-wise multiplication in one line is not defined for plain Python lists,
# but it is for NumPy arrays.
try:
    a = [1,2,3]
    b = [4,5,6]
    print(a*b)
except TypeError:
    # list * list raises TypeError (only list * int, i.e. repetition, is supported).
    # Catching just TypeError keeps unrelated errors visible.
    print("Not allowed in lists")

# This is allowed: arrays multiply element by element

a = np.array([1,2,3])
b = np.array([4,5,6])
print(a*b)

Not allowed in lists
[ 4 10 18]


In [4]:
# Create 1D array
a = np.array([1,2,3])
print(a)

[1 2 3]


In [5]:
# Create 2D array
b = np.array([[9.0,8.0,7.0], [11.0,10.0,9.0]])

In [6]:
#Get dimensions
a.ndim

1

In [7]:
b.ndim

2

In [8]:
#Get shape
a.shape   # vector

(3,)

In [9]:
b.shape

(2, 3)

In [10]:
#Get Type
a.dtype

dtype('int32')

In [11]:
b.dtype

dtype('float64')

In [12]:
# Change dtype
c = np.array([1,2,3], dtype='int16')
c.dtype

dtype('int16')

In [16]:
# Get size of each element
a.itemsize

4

In [17]:
b.itemsize

8

In [18]:
c.itemsize

2

In [20]:
# Get size of array ( number of elements)
a.size

3

In [21]:
# Get total size
a.size * a.itemsize

12

In [22]:
# Get total size (alternatively)
a.nbytes

12

# Accessing / changing specific elements, rows, columns, etc.

In [23]:
a = np.array([[1,2,3,4,5,6,7],[8,9,10,11,12,13,14]])
print(a)

[[ 1  2  3  4  5  6  7]
 [ 8  9 10 11 12 13 14]]


In [24]:
# get specific elements [r,c]
a[1,5]

13

In [26]:
# get specific row ( example index position 0 and all columns)
a[0,:]

array([1, 2, 3, 4, 5, 6, 7])

In [27]:
# get specific column and all rows
a[:,2]

array([ 3, 10])

In [28]:
# getting a little more fancy [ startindex:endindex:stepsize]
a[0, 1:-1:2]

array([2, 4, 6])

In [30]:
# change values in the matrices
a[1,5] = 20
print(a)

[[ 1  2  3  4  5  6  7]
 [ 8  9 10 11 12 20 14]]


In [31]:
# set column 2 of every row to the same value
a[:,2]= 99
print(a)

[[ 1  2 99  4  5  6  7]
 [ 8  9 99 11 12 20 14]]


In [32]:
# set column 2 to a different value in each row (one list entry per row)
a[:,2]= [100,200]
print(a)

[[  1   2 100   4   5   6   7]
 [  8   9 200  11  12  20  14]]


# 3D examples

In [34]:
b = np.array([[[1,2],[3,4]],[[5,6],[7,8]]])
print(b)

[[[1 2]
  [3 4]]

 [[5 6]
  [7 8]]]


In [35]:
b[0,0,1]

2

In [36]:
b[:,1,:]    # [block, row, column]: row 1 of every 2-D block

array([[3, 4],
       [7, 8]])

In [38]:
# replace segments
b[:,1,:] = [[9,9],[8,8]]
print(b)

[[[1 2]
  [9 9]]

 [[5 6]
  [8 8]]]


# Initializing different types of array

## All zeroes

In [39]:
np.zeros(5)

array([0., 0., 0., 0., 0.])

In [40]:
np.zeros((2,3))

array([[0., 0., 0.],
       [0., 0., 0.]])

In [41]:
np.zeros((2,3,3))

array([[[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]],

       [[0., 0., 0.],
        [0., 0., 0.],
        [0., 0., 0.]]])

In [42]:
np.zeros((2,3,3,4))

array([[[[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]],

        [[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]],

        [[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]]],


       [[[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]],

        [[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]],

        [[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]]]])

## All 1s matrix

In [45]:
np.ones((4,5,3), dtype='int32')

array([[[1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1]],

       [[1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1]],

       [[1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1]],

       [[1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1],
        [1, 1, 1]]])

## any number

In [46]:
np.full((2,2),99, dtype = 'float32')

array([[99., 99.],
       [99., 99.]], dtype=float32)

In [47]:
# any other number, reusing the shape (and dtype) of an existing array (full_like)
np.full_like(a,4)

array([[4, 4, 4, 4, 4, 4, 4],
       [4, 4, 4, 4, 4, 4, 4]])

In [48]:
# random decimal numbers
np.random.rand(4,2)

array([[0.08880604, 0.50269916],
       [0.74098586, 0.39954873],
       [0.78881876, 0.94706066],
       [0.94490052, 0.16288698]])

In [49]:
np.random.random_sample(a.shape)

array([[0.45399463, 0.02987765, 0.9008056 , 0.39397158, 0.17839776,
        0.30268918, 0.83041705],
       [0.32612946, 0.51065575, 0.69454284, 0.35251433, 0.09637707,
        0.91838423, 0.17782828]])

In [50]:
# random integer values
np.random.randint(7)

6

In [51]:
np.random.randint(-4,7, size = (3,3))

array([[ 6, -2,  3],
       [ 3,  6,  1],
       [ 0,  4,  0]])

In [52]:
# identity matrix
np.identity(5)

array([[1., 0., 0., 0., 0.],
       [0., 1., 0., 0., 0.],
       [0., 0., 1., 0., 0.],
       [0., 0., 0., 1., 0.],
       [0., 0., 0., 0., 1.]])

In [55]:
# repeat an array
arr = np.array([1,2,3])
r1 = np.repeat(arr,3, axis = 0)
print(r1)

[1 1 1 2 2 2 3 3 3]


In [56]:
arr = np.array([[1,2,3]])
r1 = np.repeat(arr,3, axis = 0)
print(r1)

[[1 2 3]
 [1 2 3]
 [1 2 3]]


In [57]:
arr = np.array([[1,2,3]])
r1 = np.repeat(arr,3, axis = 1)
print(r1)

[[1 1 1 2 2 2 3 3 3]]


# example problem
![image.png](attachment:image.png)

## Solution

In [59]:
# Start from a 5x5 grid of ones, zero out the interior, then mark the centre with 9.
new_arr = np.full((5,5),1)
new_arr[1:-1,1:-1] = 0   # everything except the outer border
# Take each axis's own midpoint so the centre is still correct for non-square shapes.
centre_row, centre_col = (length // 2 for length in new_arr.shape)
new_arr[centre_row, centre_col] = 9
print(new_arr)

[[1 1 1 1 1]
 [1 0 0 0 1]
 [1 0 9 0 1]
 [1 0 0 0 1]
 [1 1 1 1 1]]


# Alternate solution

In [60]:
# Build the 3x3 interior first: all zeros with a 9 in its middle cell
z = np.zeros((3,3))
z[1,1] = 9

# Then drop that interior into a 5x5 frame of ones, leaving a one-cell border
output = np.ones((5,5))
output[1:-1,1:-1] = z
print(output)

[[1. 1. 1. 1. 1.]
 [1. 0. 0. 0. 1.]
 [1. 0. 9. 0. 1.]
 [1. 0. 0. 0. 1.]
 [1. 1. 1. 1. 1.]]


# Be careful when copying arrays!!

In [61]:
a = np.array([1,2,3])
b = a
b

array([1, 2, 3])

In [62]:
b[0]=100
print(a)
print(b)

# changes are reflected on 'a' as well. We did not copy values but instead created a reference!!

[100   2   3]
[100   2   3]


In [63]:
# use this instead 
b = a.copy()
b[0] = 200
print(a)
print(b)

[100   2   3]
[200   2   3]


# Mathematics

In [64]:
a = np.array([1,2,3,4])
print(a)

[1 2 3 4]


In [65]:
a+=2
print(a)

a = a-2
print(a)

a = a*2
print(a)

a = a/2
print(a)

[3 4 5 6]
[1 2 3 4]
[2 4 6 8]
[1. 2. 3. 4.]


In [66]:
b = np.array([1,0,1,0])
a+b

array([2., 2., 4., 4.])

In [67]:
a**2

array([ 1.,  4.,  9., 16.])

In [68]:
print(np.sin(a))
print(np.cos(a))

[ 0.84147098  0.90929743  0.14112001 -0.7568025 ]
[ 0.54030231 -0.41614684 -0.9899925  -0.65364362]


## Linear Algebra

In [69]:
a = np.ones((2,3))
print(a)
b = np.full((3,2),2)
print(b)

[[1. 1. 1.]
 [1. 1. 1.]]
[[2 2]
 [2 2]
 [2 2]]


In [70]:
try:
    a*b # element-wise product fails: the two shapes cannot be broadcast together
except ValueError:
    # NumPy raises ValueError for non-broadcastable operands; catching only that
    # keeps unrelated errors visible. Use the matrix product instead.
    print(np.matmul(a,b))

[[6. 6.]
 [6. 6.]]


In [71]:
# find determinant
c = np.identity(3)
np.linalg.det(c)

1.0

# Statistics

In [72]:
stats = np.array([[1,2,3],[4,5,6]])
stats

array([[1, 2, 3],
       [4, 5, 6]])

In [73]:
np.min(stats)

1

In [74]:
np.min(stats, axis=1)

array([1, 4])

In [75]:
np.min(stats, axis=0)

array([1, 2, 3])

In [76]:
np.max(stats)

6

In [77]:
np.mean(stats)

3.5

In [78]:
np.sum(stats)

21

In [79]:
np.sum(stats, axis = 0)

array([5, 7, 9])

In [80]:
np.sum(stats, axis = 1)

array([ 6, 15])

# Reorganizing arrays

In [81]:
before = np.array([[1,2,3,4],[5,6,7,8]])
print(before)

# The same eight values laid out under three different shapes:
# a column vector, a 4x2 matrix, and a 2x2x2 cube.
for new_shape in ((8,1), (4,2), (2,2,2)):
    after = before.reshape(new_shape)
    print(after)

[[1 2 3 4]
 [5 6 7 8]]
[[1]
 [2]
 [3]
 [4]
 [5]
 [6]
 [7]
 [8]]
[[1 2]
 [3 4]
 [5 6]
 [7 8]]
[[[1 2]
  [3 4]]

 [[5 6]
  [7 8]]]


In [82]:
# Vertically stack vectors
v1 = np.array([1,2,3,4])
v2 = np.array([5,6,7,8])
np.vstack([v1,v2,v1,v2])

array([[1, 2, 3, 4],
       [5, 6, 7, 8],
       [1, 2, 3, 4],
       [5, 6, 7, 8]])

In [83]:
# Horizontal stack
np.hstack([v1,v2,v1,v2])

array([1, 2, 3, 4, 5, 6, 7, 8, 1, 2, 3, 4, 5, 6, 7, 8])

# Miscellaneous

In [84]:
# load data from files
filedata = np.genfromtxt('npdata.txt',delimiter = ',')

In [85]:
# change dtype
filedata = filedata.astype('int32')

In [86]:
filedata

array([[ 1,  2,  3,  4,  5,  6,  7,  8,  1,  2,  3,  4,  5,  6,  7,  8],
       [ 3,  5,  7,  8,  9, 11,  8,  7,  3,  5,  7,  8,  9, 11,  8,  7]])

#### Boolean masking and advanced indexing

In [87]:
filedata > 2

array([[False, False,  True,  True,  True,  True,  True,  True, False,
        False,  True,  True,  True,  True,  True,  True],
       [ True,  True,  True,  True,  True,  True,  True,  True,  True,
         True,  True,  True,  True,  True,  True,  True]])

In [88]:
filedata[filedata>4]

array([ 5,  6,  7,  8,  5,  6,  7,  8,  5,  7,  8,  9, 11,  8,  7,  5,  7,
        8,  9, 11,  8,  7])

In [89]:
# you can index with a list in numpy
a = np.array([1,2,3,4,5,6,7,8,9])
a[[1,2,8]]

array([2, 3, 9])

In [90]:
np.any(filedata> 5, axis = 0)

array([False, False,  True,  True,  True,  True,  True,  True, False,
       False,  True,  True,  True,  True,  True,  True])

In [91]:
np.all(filedata> 5, axis = 0)

array([False, False, False, False, False,  True,  True,  True, False,
       False, False, False, False,  True,  True,  True])

In [92]:
np.any(filedata> 5, axis = 1)

array([ True,  True])

In [93]:
((filedata> 5) & (filedata< 7))

array([[False, False, False, False, False,  True, False, False, False,
        False, False, False, False,  True, False, False],
       [False, False, False, False, False, False, False, False, False,
        False, False, False, False, False, False, False]])

In [94]:
# NOTE: `~` binds tighter than `&`, so only the first mask is negated here:
# this evaluates (not filedata > 5) and (filedata < 7), i.e. filedata <= 5.
# To negate the whole condition, write ~((filedata > 5) & (filedata < 7)).
(~(filedata> 5) & (filedata< 7))

array([[ True,  True,  True,  True,  True, False, False, False,  True,
         True,  True,  True,  True, False, False, False],
       [ True,  True, False, False, False, False, False, False,  True,
         True, False, False, False, False, False, False]])