# 4  NumPy Basics: Arrays and Vectorized Computation

In [1]:
import numpy as np

elems = 10**6
np_arr = np.arange(elems)
l_arr = list(range(elems))


#### Computational comparison of np.array and list

In [2]:
%time for _ in range(10): np_arr * 2 

CPU times: user 19.5 ms, sys: 3.88 ms, total: 23.4 ms
Wall time: 22.7 ms


In [3]:
%time for _ in range(10): [x * 2 for x in l_arr]

CPU times: user 525 ms, sys: 115 ms, total: 641 ms
Wall time: 643 ms


## Multidimensional array

In [4]:
import numpy as np

In [5]:
data = np.random.randn(2,3) # normal distribution
data 

array([[ 0.42846392, -0.05377925, -0.6987901 ],
       [ 0.96560994, -1.1956351 , -0.08666424]])

In [6]:
mu = 3000
sigma = 10
data * sigma + mu # standard-normal samples rescaled to mean mu and standard deviation sigma

array([[3004.28463919, 2999.4622075 , 2993.01209897],
       [3009.65609942, 2988.04364898, 2999.13335755]])

In [7]:
data + data

array([[ 0.85692784, -0.1075585 , -1.39758021],
       [ 1.93121988, -2.3912702 , -0.17332849]])

In [8]:
data.shape

(2, 3)

In [9]:
data.dtype

dtype('float64')

In [10]:
type(data)

numpy.ndarray

## Creating an ndarray

In [11]:
data_l = [1,2,3.3,4.4]
data_np = np.array(data_l)
print(data_np.shape)
print(data_np.dtype)
print(data_np.ndim)
data_np

(4,)
float64
1


array([1. , 2. , 3.3, 4.4])

In [12]:
data_l = [[1,2,3.3,4.4], [5,6,7,8]]
data_np = np.array(data_l)
print(data_np.shape)
print(data_np.dtype)
print(data_np.ndim)
data_np

(2, 4)
float64
2


array([[1. , 2. , 3.3, 4.4],
       [5. , 6. , 7. , 8. ]])

In [13]:
np.zeros((3, 10))

array([[0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0., 0., 0., 0., 0., 0.],
       [0., 0., 0., 0., 0., 0., 0., 0., 0., 0.]])

In [14]:
np.empty((2, 3, 1)) # memory is not initialized: the displayed values are arbitrary leftovers, not zeros

array([[[0.85692784],
        [0.1075585 ],
        [1.39758021]],

       [[1.93121988],
        [2.3912702 ],
        [0.17332849]]])

In [15]:
np.ones(5)

array([1., 1., 1., 1., 1.])

In [16]:
np.arange(15)

array([ 0,  1,  2,  3,  4,  5,  6,  7,  8,  9, 10, 11, 12, 13, 14])

In [17]:
np.eye(5)

array([[1., 0., 0., 0., 0.],
       [0., 1., 0., 0., 0.],
       [0., 0., 1., 0., 0.],
       [0., 0., 0., 1., 0.],
       [0., 0., 0., 0., 1.]])

In [18]:
np.full_like(data_np, np.nan)

array([[nan, nan, nan, nan],
       [nan, nan, nan, nan]])

In [19]:
my_array1 = np.array([1,2,3.,4.])
my_array2 = np.array([1,2,3.,4.], dtype='int32')

In [20]:
print(my_array1.dtype)
print(my_array2.dtype)

float64
int32


## ndarray.astype()

In [21]:
my_array1.astype('int32')

array([1, 2, 3, 4], dtype=int32)

## Arithmetic with NumPy Arrays

In [22]:
arr = np.array([[1,2,3],[4,5,6.]], dtype='float64')
arr.dtype

dtype('float64')

In [23]:
arr + arr

array([[ 2.,  4.,  6.],
       [ 8., 10., 12.]])

In [24]:
arr * arr # element-wise product; this is NOT matrix multiplication

array([[ 1.,  4.,  9.],
       [16., 25., 36.]])

In [25]:
arr - arr

array([[0., 0., 0.],
       [0., 0., 0.]])

In [26]:
arr/arr

array([[1., 1., 1.],
       [1., 1., 1.]])

In [27]:
1/arr

array([[1.        , 0.5       , 0.33333333],
       [0.25      , 0.2       , 0.16666667]])

In [28]:
arr**2

array([[ 1.,  4.,  9.],
       [16., 25., 36.]])

In [29]:
arr ** 0.5

array([[1.        , 1.41421356, 1.73205081],
       [2.        , 2.23606798, 2.44948974]])

In [30]:
arr2 = 3*arr
arr2

array([[ 3.,  6.,  9.],
       [12., 15., 18.]])

In [31]:
arr2>arr

array([[ True,  True,  True],
       [ True,  True,  True]])

In [32]:
arr2<arr

array([[False, False, False],
       [False, False, False]])

## Basic indexing and slicing

In [33]:
arr = np.arange(5)

In [34]:
arr

array([0, 1, 2, 3, 4])

In [35]:
arr[2]

2

In [36]:
arr[3:]

array([3, 4])

In [37]:
len(arr)

5

In [38]:
arr[3:4]

array([3])

In [39]:
arr[2:5] = 33

In [40]:
arr

array([ 0,  1, 33, 33, 33])

In [41]:
arr2 = arr[0:2]
arr2

array([0, 1])

In [42]:
arr2[0] = 99
arr

array([99,  1, 33, 33, 33])

In [43]:
arr2[:] = 5555
arr

array([5555, 5555,   33,   33,   33])

In [44]:
arr3 = arr.copy()
arr4 = arr3[0:2]
arr4[:] = 999
arr

array([5555, 5555,   33,   33,   33])

In [45]:
arr2d = np.array([[1, 2, 3], [4, 5, 6], [7, 8, 9]])

In [46]:
arr2d[0][1]

2

In [47]:
arr2d[0, 1]

2

In [48]:
arr2d[0, 1] = 99
arr2d

array([[ 1, 99,  3],
       [ 4,  5,  6],
       [ 7,  8,  9]])

In [49]:
arr3d = np.array([[ [1, 2, 3],[4, 5, 6]], [[7, 8, 9], [10, 11, 12]] ])
print(arr3d)
print("\n", arr3d[0,1,2])
print("\n", arr3d[1])
print("\n", arr3d[1,1])

[[[ 1  2  3]
  [ 4  5  6]]

 [[ 7  8  9]
  [10 11 12]]]

 6

 [[ 7  8  9]
 [10 11 12]]

 [10 11 12]


In [50]:
x = arr3d[1].copy()

In [51]:
x

array([[ 7,  8,  9],
       [10, 11, 12]])

In [52]:
x[0]

array([7, 8, 9])

In [53]:
x[0,2] = 99

In [54]:
arr3d

array([[[ 1,  2,  3],
        [ 4,  5,  6]],

       [[ 7,  8,  9],
        [10, 11, 12]]])

In [55]:
x

array([[ 7,  8, 99],
       [10, 11, 12]])

### Indexing with slices

In [56]:
arr = np.array([ 0,  1,  2,  3,  4, 64, 64, 64,  8,  9])
arr[1:6]

array([ 1,  2,  3,  4, 64])

In [57]:
arr2d

array([[ 1, 99,  3],
       [ 4,  5,  6],
       [ 7,  8,  9]])

In [58]:
arr2d[:2]

array([[ 1, 99,  3],
       [ 4,  5,  6]])

In [59]:
arr2d[:2,1:]

array([[99,  3],
       [ 5,  6]])

In [60]:
arr2d[:2,1]

array([99,  5])

In [61]:
arr2d[1,:2]

array([4, 5])

In [62]:
arr2d[:2, 2]

array([3, 6])

In [63]:
arr2d[:, :1]

array([[1],
       [4],
       [7]])

In [64]:
print(arr2d)
arr2d[:2, 1:] = 0
print(arr2d[:2, 1:].shape)
print(arr2d)

[[ 1 99  3]
 [ 4  5  6]
 [ 7  8  9]]
(2, 2)
[[1 0 0]
 [4 0 0]
 [7 8 9]]


In [65]:
arr2d=np.random.randn(3,3)
print(arr2d)
arr2d[2] = 0
print(arr2d[2].shape)
print(arr2d)

[[-0.26497439  0.52358103 -0.58707552]
 [ 0.46426188  0.78830894 -0.11122949]
 [ 0.54205313 -2.06462012 -1.80440672]]
(3,)
[[-0.26497439  0.52358103 -0.58707552]
 [ 0.46426188  0.78830894 -0.11122949]
 [ 0.          0.          0.        ]]


In [66]:
arr2d=np.random.randn(3,3)
print(arr2d)
arr2d[2] = 0
print(arr2d[2].shape)
print(arr2d)

[[ 0.60965149 -1.07966425  1.81412387]
 [ 0.24492279 -0.43773485 -0.60522452]
 [-0.64358887  1.14429629 -1.65746855]]
(3,)
[[ 0.60965149 -1.07966425  1.81412387]
 [ 0.24492279 -0.43773485 -0.60522452]
 [ 0.          0.          0.        ]]


In [67]:
import numpy as np
array3d = np.array([[[1,2,3],[4,5,6]],[[7,8,9],[10,11,12]]])
array3d

array([[[ 1,  2,  3],
        [ 4,  5,  6]],

       [[ 7,  8,  9],
        [10, 11, 12]]])

In [68]:
a3d_cp=array3d[0].copy()
array3d[0]=13
array3d

array([[[13, 13, 13],
        [13, 13, 13]],

       [[ 7,  8,  9],
        [10, 11, 12]]])

In [69]:
array3d[0]=a3d_cp
array3d

array([[[ 1,  2,  3],
        [ 4,  5,  6]],

       [[ 7,  8,  9],
        [10, 11, 12]]])

In [70]:
x=array3d[1]
x

array([[ 7,  8,  9],
       [10, 11, 12]])

In [71]:
arr2d=np.array([[1, 2, 3],[4, 5, 6],[7, 8, 9]])
arr2d

array([[1, 2, 3],
       [4, 5, 6],
       [7, 8, 9]])

In [72]:
arr2d[1:,1:]

array([[5, 6],
       [8, 9]])

In [73]:
arr2d[:2,1:]

array([[2, 3],
       [5, 6]])

In [74]:
arr2d[1,:2]

array([4, 5])

In [75]:
arr2d[:2,2]

array([3, 6])

In [76]:
arr2d[:,:1]

array([[1],
       [4],
       [7]])

## Boolean indexing

In [77]:
names = np.array(['Bob', 'Joe', 'Will', 'Bob', 'Will', 'Joe', 'Joe'])
names


array(['Bob', 'Joe', 'Will', 'Bob', 'Will', 'Joe', 'Joe'], dtype='<U4')

In [78]:
data = np.random.randn(7, 4)*0.5+100
data

array([[100.34449414, 100.1180271 ,  99.40327959, 100.06891679],
       [101.0334102 , 100.46268886, 100.38845864,  99.31592058],
       [100.03688625, 100.18192506,  99.40541583,  99.95654739],
       [100.11316482, 100.20061934, 100.44819574, 101.01705587],
       [100.22161572, 100.24783584,  99.57867978,  99.67168027],
       [ 99.50835723, 100.06032479, 100.13980205, 100.53335573],
       [101.13157204, 100.37130025,  99.70085831, 100.53353285]])

In [79]:
names == 'Bob'

array([ True, False, False,  True, False, False, False])

In [80]:
data[names=='Bob']

array([[100.34449414, 100.1180271 ,  99.40327959, 100.06891679],
       [100.11316482, 100.20061934, 100.44819574, 101.01705587]])

In [81]:
data[names=='Bob', 2:]

array([[ 99.40327959, 100.06891679],
       [100.44819574, 101.01705587]])

In [82]:
data[names=='Bob', 3]

array([100.06891679, 101.01705587])

In [83]:
data[~(names=='Bob')]

array([[101.0334102 , 100.46268886, 100.38845864,  99.31592058],
       [100.03688625, 100.18192506,  99.40541583,  99.95654739],
       [100.22161572, 100.24783584,  99.57867978,  99.67168027],
       [ 99.50835723, 100.06032479, 100.13980205, 100.53335573],
       [101.13157204, 100.37130025,  99.70085831, 100.53353285]])

In [84]:
cond = names=='Bob'

In [85]:
data[~cond]

array([[101.0334102 , 100.46268886, 100.38845864,  99.31592058],
       [100.03688625, 100.18192506,  99.40541583,  99.95654739],
       [100.22161572, 100.24783584,  99.57867978,  99.67168027],
       [ 99.50835723, 100.06032479, 100.13980205, 100.53335573],
       [101.13157204, 100.37130025,  99.70085831, 100.53353285]])

In [86]:
mask = (names=='Bob') | (names=='Joe')
mask

array([ True,  True, False,  True, False,  True,  True])

In [87]:
data[~mask]

array([[100.03688625, 100.18192506,  99.40541583,  99.95654739],
       [100.22161572, 100.24783584,  99.57867978,  99.67168027]])

In [88]:
data[data>100]=999
data

array([[999.        , 999.        ,  99.40327959, 999.        ],
       [999.        , 999.        , 999.        ,  99.31592058],
       [999.        , 999.        ,  99.40541583,  99.95654739],
       [999.        , 999.        , 999.        , 999.        ],
       [999.        , 999.        ,  99.57867978,  99.67168027],
       [ 99.50835723, 999.        , 999.        , 999.        ],
       [999.        , 999.        ,  99.70085831, 999.        ]])

In [89]:
data[names != 'Joe'] = 7
data

array([[  7.        ,   7.        ,   7.        ,   7.        ],
       [999.        , 999.        , 999.        ,  99.31592058],
       [  7.        ,   7.        ,   7.        ,   7.        ],
       [  7.        ,   7.        ,   7.        ,   7.        ],
       [  7.        ,   7.        ,   7.        ,   7.        ],
       [ 99.50835723, 999.        , 999.        , 999.        ],
       [999.        , 999.        ,  99.70085831, 999.        ]])

## Fancy indexing

In [90]:
import numpy as np
arr = np.empty((8,4))
print(arr)

[[1.89008963e-316 0.00000000e+000 0.00000000e+000 0.00000000e+000]
 [6.94635322e-310 5.02034658e+175 1.83093485e-076 8.85418137e+165]
 [2.44898059e-056 1.77428229e+160 1.53079487e-047 4.25942538e-096]
 [1.12855837e+277 8.93168725e+271 4.76484771e+180 1.70098498e+256]
 [5.49109388e-143 6.99645177e+228 1.35617292e+248 9.62734727e+183]
 [4.47032825e-090 6.17042841e-062 4.81721212e-038 1.05931250e+165]
 [5.28555805e+180 6.74640243e-067 6.98476580e-076 5.06636306e-086]
 [3.35558939e-143 9.30350598e+199 4.24941018e-086 6.94650366e-310]]


In [91]:
for i in range(arr.shape[0]):
    arr[i]=i
arr

array([[0., 0., 0., 0.],
       [1., 1., 1., 1.],
       [2., 2., 2., 2.],
       [3., 3., 3., 3.],
       [4., 4., 4., 4.],
       [5., 5., 5., 5.],
       [6., 6., 6., 6.],
       [7., 7., 7., 7.]])

In [92]:
arr[[4,3,0,6]]

array([[4., 4., 4., 4.],
       [3., 3., 3., 3.],
       [0., 0., 0., 0.],
       [6., 6., 6., 6.]])

In [93]:
arr = np.arange(32)
arr = arr.reshape(8,4)

In [94]:
arr[[1, 5, 7, 2], [0, 3, 1, 2]]

array([ 4, 23, 29, 10])

## Transposing arrays & swapping axes

In [109]:
arr = np.arange(15).reshape(3,5)
arr

array([[ 0,  1,  2,  3,  4],
       [ 5,  6,  7,  8,  9],
       [10, 11, 12, 13, 14]])

In [113]:
arr.T # evaluates to the transposed array; arr itself is not modified

array([[ 0,  5, 10],
       [ 1,  6, 11],
       [ 2,  7, 12],
       [ 3,  8, 13],
       [ 4,  9, 14]])

In [114]:
arr 

array([[ 0,  1,  2,  3,  4],
       [ 5,  6,  7,  8,  9],
       [10, 11, 12, 13, 14]])

In [115]:
arr = np.random.randn(6, 3)
arr

array([[ 1.81578587,  0.61554645,  0.02643213],
       [ 0.06212248, -0.44277317, -0.65404883],
       [-0.3591492 , -0.28545245,  1.10228936],
       [ 1.88969219, -0.89329646, -0.78162397],
       [ 0.88569147, -0.86741562,  1.3446729 ],
       [-0.52296404,  1.1153712 , -1.20118521]])

In [116]:
np.dot(arr.T, arr) # matrix product of shapes (3, 6) x (6, 3) -> (3, 3)

array([[ 8.05880304, -1.84690259, -0.04640913],
       [-1.84690259,  3.45086995, -1.81672146],
       [-0.04640913, -1.81672146,  5.50544752]])

In [99]:
# 5x4 integer matrix with every entry equal to 3, built directly with np.full
# instead of materializing a 20-element Python list and reshaping it.
a = np.full((5, 4), 3)
a

array([[3, 3, 3, 3],
       [3, 3, 3, 3],
       [3, 3, 3, 3],
       [3, 3, 3, 3],
       [3, 3, 3, 3]])

In [100]:
b = np.dot(a, a.T)
b

array([[36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36]])

In [101]:
c = a @ a.T
c

array([[36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36],
       [36, 36, 36, 36, 36]])

In [119]:
arr = np.arange(16).reshape((2, 2, 4))
arr

array([[[ 0,  1,  2,  3],
        [ 4,  5,  6,  7]],

       [[ 8,  9, 10, 11],
        [12, 13, 14, 15]]])

In [123]:
arr.transpose((1, 0, 2))

array([[[ 0,  1,  2,  3],
        [ 8,  9, 10, 11]],

       [[ 4,  5,  6,  7],
        [12, 13, 14, 15]]])

In [102]:
arr = np.arange(16).reshape((2, 2, 4))

In [103]:
arr

array([[[ 0,  1,  2,  3],
        [ 4,  5,  6,  7]],

       [[ 8,  9, 10, 11],
        [12, 13, 14, 15]]])

In [104]:
arr.T

array([[[ 0,  8],
        [ 4, 12]],

       [[ 1,  9],
        [ 5, 13]],

       [[ 2, 10],
        [ 6, 14]],

       [[ 3, 11],
        [ 7, 15]]])

In [105]:
a = arr.swapaxes(1,2)
a

array([[[ 0,  4],
        [ 1,  5],
        [ 2,  6],
        [ 3,  7]],

       [[ 8, 12],
        [ 9, 13],
        [10, 14],
        [11, 15]]])

In [106]:
# swapaxes(1, 0) exchanges the first two axes and leaves the last axis alone,
# so b[i, j, k] == arr[j, i, k]. For this 3-D array the result is the same as
# arr.transpose((1, 0, 2)).
b = arr.swapaxes(1,0)
b

array([[[ 0,  1,  2,  3],
        [ 8,  9, 10, 11]],

       [[ 4,  5,  6,  7],
        [12, 13, 14, 15]]])

## Universal functions: Fast Element-Wise Array Functions

In [125]:
arr = np.arange(10)
arr

array([0, 1, 2, 3, 4, 5, 6, 7, 8, 9])

In [129]:
np.sqrt(arr)

array([0.        , 1.        , 1.41421356, 1.73205081, 2.        ,
       2.23606798, 2.44948974, 2.64575131, 2.82842712, 3.        ])

In [130]:
np.sum(arr)

45

In [131]:
np.exp(arr)

array([1.00000000e+00, 2.71828183e+00, 7.38905610e+00, 2.00855369e+01,
       5.45981500e+01, 1.48413159e+02, 4.03428793e+02, 1.09663316e+03,
       2.98095799e+03, 8.10308393e+03])

In [137]:
x = np.random.randn(5)
display(x)
y = np.random.randn(5)
display(y)
np.maximum(x, y)

array([ 1.40500477,  0.08869926, -0.29663349, -0.54552558, -0.24698511])

array([-0.71706502, -1.54459508, -1.03622708,  0.78936051,  1.13990757])

array([ 1.40500477,  0.08869926, -0.29663349,  0.78936051,  1.13990757])

In [142]:
x = np.random.randn(3) * 4
# np.modf returns (fractional part, integral part), in that order, and both
# parts carry the sign of x. "decimal" holds the fractional part and "entera"
# (Spanish for "whole") holds the integral part.
decimal, entera = np.modf(x)
# Printed order: original values, fractional parts, integral parts.
print(x, decimal, entera, sep="\n")

[-5.11387038 -6.70351665 -0.98301614]
[-0.11387038 -0.70351665 -0.98301614]
[-5. -6. -0.]


In [152]:
x = np.arange(10)
# np.divmod returns the element-wise (quotient, remainder) pair, i.e.
# (x // 2, x % 2).
div, rest = np.divmod(x, 2)
# Print the values computed in this cell; no variables from earlier cells
# are used.
print(x, div, rest, sep="\n")

[0 1 2 3 4 5 6 7 8 9]
[0 0 1 1 2 2 3 3 4 4]
[0 1 0 1 0 1 0 1 0 1]


In [159]:
arr = np.array([-3.2623, 6.0915, -6.663])   
print(arr)
out_arr = np.zeros_like(arr)
print(out_arr)
np.add(arr, 1, out=out_arr)
print(arr, out_arr, sep="\n")

[-3.2623  6.0915 -6.663 ]
[0. 0. 0.]
[-3.2623  6.0915 -6.663 ]
[-2.2623  7.0915 -5.663 ]


In [165]:
# log1p(x) computes log(1 + x), which is undefined for x < -1. The negative
# entries of arr (both below -1 here) come back as nan, and NumPy emits a
# RuntimeWarning.
np.log1p(arr)

  np.log1p(arr)


array([       nan, 1.95889688,        nan])