In [2]:
import torch
import pandas as pd
import numpy as np
import matplotlib.pyplot as plt

In [3]:
# Environment check: is a CUDA GPU visible, and which PyTorch version is installed?
print(torch.cuda.is_available(), torch.__version__, sep='\n')

True
2.0.0


Introduction to tensors
##### Create tensor
PyTorch tensors are created using the `torch.tensor()` function. It takes a list or a NumPy array as an argument and returns a tensor.
https://pytorch.org/docs/stable/tensors.html

In [4]:
# Scalar: a single number wrapped in a tensor (no list brackets around the value)
scalar = torch.tensor(7)
print(scalar)

tensor(7)


In [5]:
# ndim is the number of dimensions; the scalar tensor reports 0
print(scalar.ndim)

0


In [6]:
# .item() hands the single value back as a plain Python number (7 rather than tensor(7))
print(scalar.item())

7


In [7]:
# Vector: a tensor built from a flat list of numbers
vector = torch.tensor([7, 7])
print(vector)


tensor([7, 7])


In [8]:
# A vector has a single dimension (one level of square brackets)
print(vector.ndim)

1


In [9]:
# shape lists the size along each dimension: here one dimension holding 2 elements
vector.shape

torch.Size([2])

In [10]:
# Matrix: a 2-D tensor built from a nested list (two rows of two values each)
MATRIX = torch.tensor([[7, 8], [9, 10]])
print(MATRIX)

tensor([[ 7,  8],
        [ 9, 10]])


In [11]:
# A matrix has two dimensions (two levels of square brackets)
print(MATRIX.ndim)

2


In [12]:
# Index 1 along the first dimension selects the second row
print(MATRIX[1])

tensor([ 9, 10])


In [13]:
print(MATRIX.shape) # reported in the form (rows, columns)

torch.Size([2, 2])


In [14]:
# TENSOR: three levels of nesting -> one 3x3 matrix wrapped in an outer dimension
TENSOR = torch.tensor([
    [
        [1, 2, 3],
        [3, 6, 9],
        [2, 4, 5],
    ],
])
print(TENSOR)

tensor([[[1, 2, 3],
         [3, 6, 9],
         [2, 4, 5]]])


In [15]:
# Three levels of nested brackets give three dimensions
print(TENSOR.ndim)

3


In [16]:
print(TENSOR.shape) # reported in the form (outer dimension, rows, columns)

torch.Size([1, 3, 3])


In [17]:
# Index 0 along the first dimension returns the single 3x3 matrix inside
print(TENSOR[0])

tensor([[1, 2, 3],
        [3, 6, 9],
        [2, 4, 5]])


#### Random tensors
Random tensors are important because many neural networks learn by starting with tensors full of random numbers and then adjusting those random numbers to better represent the data. <br>
- Start with random numbers -> look at data -> update random numbers -> look at data -> update random numbers <br>
More information: https://pytorch.org/docs/stable/generated/torch.rand.html

In [18]:
# Random tensor with 3 rows and 4 columns
random_tensor = torch.rand(size=(3, 4))
print(random_tensor)

tensor([[0.0310, 0.5228, 0.1162, 0.2556],
        [0.7432, 0.8796, 0.9716, 0.7536],
        [0.9741, 0.8295, 0.3390, 0.1651]])


In [19]:
# Two sizes were passed to torch.rand, so the tensor has 2 dimensions
random_tensor.ndim

2

In [20]:
random_tensor_1layer = torch.rand(1, 3, 4) # 1 outer dimension (layer), 3 rows and 4 columns
print(random_tensor_1layer)

tensor([[[0.9945, 0.2964, 0.6171, 0.1014],
         [0.4859, 0.5382, 0.5900, 0.6121],
         [0.7877, 0.5424, 0.8356, 0.5103]]])


In [21]:
# The leading size of 1 still counts as a dimension, giving 3 in total
random_tensor_1layer.ndim

3

In [22]:
# Random tensor laid out like an image: (color channels, height, width)
random_image_size_tensor = torch.rand(3, 224, 224)
print(f'size = {random_image_size_tensor.shape}\nndim = {random_image_size_tensor.ndim}')

size = torch.Size([3, 224, 224])
ndim = 3


In [23]:
# Printing a tensor this large is abbreviated by PyTorch with '...' (see the output below)
print(random_image_size_tensor)

tensor([[[0.6163, 0.6510, 0.5861,  ..., 0.5207, 0.4022, 0.4576],
         [0.6774, 0.8582, 0.4636,  ..., 0.8828, 0.1652, 0.6994],
         [0.6451, 0.1811, 0.6932,  ..., 0.9235, 0.8675, 0.5687],
         ...,
         [0.5426, 0.2362, 0.9250,  ..., 0.2601, 0.2886, 0.7972],
         [0.0261, 0.6683, 0.7264,  ..., 0.3603, 0.8001, 0.4031],
         [0.5631, 0.3102, 0.4428,  ..., 0.7122, 0.7425, 0.1240]],

        [[0.7880, 0.9999, 0.3862,  ..., 0.4134, 0.1310, 0.7351],
         [0.0170, 0.9099, 0.2129,  ..., 0.7645, 0.0618, 0.2743],
         [0.1035, 0.5554, 0.6000,  ..., 0.2552, 0.3833, 0.3320],
         ...,
         [0.9599, 0.2829, 0.0562,  ..., 0.2857, 0.0031, 0.6838],
         [0.1097, 0.3847, 0.0177,  ..., 0.2178, 0.3740, 0.0229],
         [0.6369, 0.0565, 0.1347,  ..., 0.4852, 0.9552, 0.1291]],

        [[0.3407, 0.2418, 0.2287,  ..., 0.1022, 0.4294, 0.6361],
         [0.2459, 0.8747, 0.6877,  ..., 0.7403, 0.2354, 0.2466],
         [0.3176, 0.1717, 0.1824,  ..., 0.9488, 0.2278, 0.

### Zeros and Ones tensors

In [24]:
# All-zeros tensor with 3 rows and 4 columns
zeros = torch.zeros(3, 4)
print(zeros)

tensor([[0., 0., 0., 0.],
        [0., 0., 0., 0.],
        [0., 0., 0., 0.]])


In [25]:
# Element-wise product with the all-zeros tensor: every entry of the result is 0
print(zeros * random_tensor)

tensor([[0., 0., 0., 0.],
        [0., 0., 0., 0.],
        [0., 0., 0., 0.]])


In [26]:
# All-ones tensor with 3 rows and 4 columns
ones = torch.ones(3, 4)
print(ones)

tensor([[1., 1., 1., 1.],
        [1., 1., 1., 1.],
        [1., 1., 1., 1.]])


In [27]:
# No dtype was requested when `ones` was created; inspect what it ended up with
print(ones.dtype)

torch.float32


In [28]:
# torch.rand produced the same dtype (torch.float32, see the output)
print(random_tensor.dtype)

torch.float32


### Creating a range of tensors and tensors-like

In [29]:
# torch.range() gives a deprecation message, so torch.arange() is used instead.
# The end value is exclusive: 11 yields the integers 1 through 10.
one_to_ten = torch.arange(1, 11)
print(one_to_ten)

tensor([ 1,  2,  3,  4,  5,  6,  7,  8,  9, 10])


In [30]:
# "Like" constructors copy the shape (and dtype) of an existing tensor; here
# the result is ten integer zeros matching one_to_ten.
ten_zeros = torch.zeros_like(one_to_ten)
print(ten_zeros)

tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0])


### Tensor Datatypes
More : https://pytorch.org/docs/stable/tensors.html

**Note** Tensor datatypes are one of the big 3 sources of errors you'll run into with PyTorch & deep learning:
1. Tensors not right datatype
2. Tensors not right shape
3. Tensors not on the right device

Precision in computing - https://en.wikipedia.org/wiki/Precision_(computer_science)

In [31]:
# Float32 tensor: with dtype left as None, this float data ends up as torch.float32
float_32_tensor = torch.tensor([3.0, 6.0, 9.0],
                               dtype = None, # datatype of the tensor, e.g. torch.float16, torch.float32, torch.float64
                               device = None, # device the tensor is stored on, e.g. None, 'cpu', 'cuda', 'cuda:0', 'cuda:1'
                               requires_grad = False) # whether gradients should be calculated for this tensor
print(float_32_tensor)

tensor([3., 6., 9.])


In [32]:
# Confirm the dtype that was chosen when dtype=None was passed
print(float_32_tensor.dtype)

torch.float32


In [33]:
# Convert the float32 tensor to float16 with .type() and keep the result under a new name
float_16_tensor = float_32_tensor.type(torch.float16)
print(float_16_tensor)

tensor([3., 6., 9.], dtype=torch.float16)


In [34]:
# Mixing float16 with float32 works: the displayed result has no dtype suffix,
# unlike the float16 tensor printed above
float_16_tensor * float_32_tensor

tensor([ 9., 36., 81.])

In [35]:
# Integer tensor with an explicitly requested 32-bit dtype
int_32_tensor = torch.tensor(data=[3, 6, 9], dtype=torch.int32)
print(int_32_tensor)

tensor([3, 6, 9], dtype=torch.int32)


In [36]:
# Mixing float32 with int32 also works; the result is displayed as floats
float_32_tensor * int_32_tensor

tensor([ 9., 36., 81.])

### Getting information from tensors
- Tensor attributes
1. Tensors not right datatype - to get the datatype of a tensor, use the `tensor.dtype` attribute
2. Tensors not right shape - to get the shape of a tensor, use the `tensor.shape` attribute
3. Tensors not on the right device - to get the device of a tensor, use the `tensor.device` attribute

In [37]:
# Random 3x4 tensor used to demonstrate the attribute look-ups that follow
some_tensor = torch.rand(size=(3, 4))
print(some_tensor)

tensor([[0.6061, 0.8154, 0.7687, 0.5634],
        [0.9220, 0.8562, 0.5223, 0.6688],
        [0.0563, 0.6181, 0.1441, 0.5378]])


In [38]:
# .size() (method) and .shape (attribute) report the same torch.Size; show both.
# The "Size" label previously printed .shape as well, so .size() was never exercised.
print(f'Size = {some_tensor.size()}\nShape = {some_tensor.shape}')

Size = torch.Size([3, 4])
Shape = torch.Size([3, 4])


In [39]:
# Summarise some_tensor: its values, then dtype, shape and device (one per line)
print(
    some_tensor,
    f'Datatype of tensor: {some_tensor.dtype}',
    f'Shape of tensor: {some_tensor.shape}',
    f'Device tensor is stored on: {some_tensor.device}',
    sep='\n',
)

tensor([[0.6061, 0.8154, 0.7687, 0.5634],
        [0.9220, 0.8562, 0.5223, 0.6688],
        [0.0563, 0.6181, 0.1441, 0.5378]])
Datatype of tensor: torch.float32
Shape of tensor: torch.Size([3, 4])
Device tensor is stored on: cpu


### Manipulating tensors ( tensor operations )

Tensor operations include:
* Addition
* Subtraction
* Multiplication (element-wise)
* Division 
* Matrix multiplication

In [40]:
# Create a tensor and add 10 to every element.
# The result is only displayed, not assigned, so `tensor` itself stays [1, 2, 3].
tensor = torch.tensor([1, 2, 3])
tensor + 10

tensor([11, 12, 13])

In [41]:
# Multiply every element of our tensor by 10
tensor * 10

tensor([10, 20, 30])

In [42]:
# Subtract 10 from every element
tensor - 10

tensor([-9, -8, -7])

In [43]:
# Try out PyTorch's built-in function form of `tensor * 10`
torch.multiply(tensor, 10) # or torch.mul(tensor, 10)

tensor([10, 20, 30])

In [44]:
# Built-in function form of `tensor + 10`
torch.add(tensor, 10)

tensor([11, 12, 13])

### Matrix multiplication

Two main ways of performing multiplication in neural networks and deep learning:

1. Element-wise multiplication
2. Matrix multiplication ( Dot product )

More information on multiplying matrices - https://www.mathsisfun.com/algebra/matrix-multiplying.html

There are two main rules that performing matrix multiplication needs to satisfy:
1. The **Inner dimensions** must match:
* `(3, 2) @ (3 , 2) ` won't work
* `(2, 3) @ (3 , 2) ` will work
* `(3, 2) @ (2 , 3) ` will work
2. The result matrix has the shape of the **Outer dimensions**:
* `(2, 3) @ (3, 2)` will result in a `(2, 2)` matrix
* `(3, 2) @ (2, 3)` will result in a `(3, 3)` matrix

Matrix multiplication application - http://matrixmultiplication.xyz/

In [45]:
# Element-wise multiplication: each element is multiplied by the element in the same position
print(tensor, '*', tensor)
print(f'Equal: {tensor * tensor}')

tensor([1, 2, 3]) * tensor([1, 2, 3])
Equal: tensor([1, 4, 9])


In [46]:
# Matrix multiplication - for two 1-D tensors the result is a single number (the dot product)
torch.matmul(tensor, tensor)

tensor(14)

In [47]:
# The same dot product written out by hand: multiply matching elements, then sum
1 * 1 + 2 * 2 + 3 * 3

14

In [48]:
%%time
# Dot product written as an explicit Python loop, timed for comparison with
# the torch.matmul call in the next cell
value = 0
for i in range(len(tensor)):
    value += tensor[i] * tensor[i]
print(value)

tensor(14)
CPU times: total: 0 ns
Wall time: 0 ns


In [49]:
%%time
# The same dot product computed by a single torch.matmul call
torch.matmul(tensor, tensor)

CPU times: total: 0 ns
Wall time: 0 ns


tensor(14)

### One of the most common errors in deep learning: shape errors

In [50]:
# Shapes for matrix multiplication: both operands are 3x2, so the inner
# dimensions (2 and 3) do not match and the product cannot be computed.
tensor_A = torch.tensor([[1, 2],
                         [3, 4],
                         [5, 6]])
tensor_B = torch.tensor([[7, 10],
                         [8, 11],
                         [9, 12]])
try:
    # torch.mm is the strictly 2-D form of matrix multiplication; unlike
    # torch.matmul it does not broadcast or accept other ranks.
    torch.mm(tensor_A, tensor_B)
except RuntimeError as shape_error:
    # The failure is the point of this cell. Show the message instead of letting
    # the exception abort a "Restart & Run All" pass, so later cells still run.
    print(f'RuntimeError: {shape_error}')

RuntimeError: mat1 and mat2 shapes cannot be multiplied (3x2 and 3x2)

Matmul also works for matrices that are not square, e.g. 3x2 and 2x3 or 3x2 and 2x4 <br> ( the number of columns of the first matrix must equal the number of rows of the second matrix )

To fix shape errors, use a **transpose** (for example the `.T` attribute) to transpose one of the matrices <br>
A transpose is when you flip a matrix along its diagonal ( turning rows into columns and vice versa )


In [51]:
# tensor_B as defined: 3 rows, 2 columns
tensor_B

tensor([[ 7, 10],
        [ 8, 11],
        [ 9, 12]])

In [52]:
# .T is the transpose: rows become columns, giving 2 rows and 3 columns
tensor_B.T

tensor([[ 7,  8,  9],
        [10, 11, 12]])

In [53]:
# With tensor_B transposed the inner dimensions match: (3, 2) @ (2, 3) -> (3, 3)
torch.matmul(tensor_A, tensor_B.T)

tensor([[ 27,  30,  33],
        [ 61,  68,  75],
        [ 95, 106, 117]])

In [58]:
# Matrix multiplication walkthrough: print the shapes before transposing,
# the shapes once tensor_B is transposed, then the product and its shape.
# tensor_A is not changed, so its shape is the same on both lines.
print(f'Original shape of tensor A: {tensor_A.shape}, tensor B: {tensor_B.shape}')
print(f'New shapes of tensor A: {tensor_A.shape}, tensor B.T: {tensor_B.T.shape}')
print(f'Multiply tensor A: {tensor_A.shape} by tensor B.T: {tensor_B.T.shape} <- Inner dimension must match \nusing torch.matmul:\n {torch.matmul(tensor_A, tensor_B.T)}\nOutput shape: {torch.matmul(tensor_A, tensor_B.T).shape}')

Original shape of tensor A: torch.Size([3, 2]), tensor B: torch.Size([3, 2])
New shapes of tensor A: torch.Size([3, 2]), tensor B.T: torch.Size([2, 3])
Multiply tensor A: torch.Size([3, 2]) by tensor B.T: torch.Size([2, 3]) <- Inner dimension must match 
using torch.matmul:
 tensor([[ 27,  30,  33],
        [ 61,  68,  75],
        [ 95, 106, 117]])
Output shape: torch.Size([3, 3])


## Finding the min, max, mean, sum, etc. (tensor aggregations)

In [80]:
# Integers from 1 up to (but not including) 100 in steps of 10, then their dtype
x = torch.arange(start=1, end=100, step=10)
print(x, x.dtype, sep='\n')

tensor([ 1, 11, 21, 31, 41, 51, 61, 71, 81, 91])
torch.int64


In [81]:
# Find min - the function form and the method form give the same result
torch.min(x), x.min()

(tensor(1), tensor(1))

In [82]:
# Find max - the function form and the method form give the same result
torch.max(x), x.max()

(tensor(91), tensor(91))

In [83]:
# Find mean - calling torch.mean() directly on this integer (int64) tensor
# fails, because mean() needs a floating point or complex input dtype.
try:
    torch.mean(x)
except RuntimeError as dtype_error:
    # Show the error message without stopping the rest of the notebook,
    # so "Restart & Run All" continues to the working versions below.
    print(f'RuntimeError: {dtype_error}')

RuntimeError: mean(): could not infer output dtype. Input dtype must be either a floating point or complex dtype. Got: Long

In [84]:
# Find mean - Note: torch.mean() requires a floating point (or complex) dtype
# Convert the integer tensor to float32 first, then take the mean
torch.mean(x.type(torch.float32))

tensor(46.)

In [85]:
# Convert type with argument
torch.mean(x, dtype = torch.float32)

tensor(46.)

In [86]:
# Method-chaining form: convert to float32, then call .mean() on the result
x.type(torch.float32).mean()

tensor(46.)

## Finding the positional maximum and minimum

In [87]:
# Show x again for reference before looking up positions in it
x

tensor([ 1, 11, 21, 31, 41, 51, 61, 71, 81, 91])

In [95]:
# argmin() returns the index position of the minimum value (not the value itself)
pos_min = x.argmin()

In [96]:
# Index x with the position found by argmin() to recover the minimum value
x[pos_min]

tensor(1)

In [97]:
# Find the position in tensor that has the maximum value with argmax() -> return index position of target maximum value
pos_max = x.argmax()
pos_max

tensor(9)

In [98]:
# Index x with the position found by argmax() to recover the maximum value
x[pos_max]

tensor(91)

## Reshaping, stacking, squeezing, unsqueezing tensor
* Reshape - reshapes an input tensor to a defined shape
* View - Return a view of an input tensor of a certain shape but keep the same memory as the original tensor
* Stacking - Combine multiple tensors on top of each other (vstack) or side by side (hstack)
* Squeezing - Remove all dimensions of size `1` from a tensor
* Unsqueeze - Add a dimension of size `1` to a tensor
* Permute - Return a view of the input with dimension permuted (swapped) in a certain way