In [2]:
import torch
import pandas as pd 
import numpy as np 
import matplotlib.pyplot as plt
print(torch.__version__)

2.0.0.dev20230121


## Introduction to tensors

### Creating tensors

In [5]:
# Scalar: a single number wrapped in a tensor (no square brackets, so 0 dimensions)
scalar = torch.tensor(7)
scalar

tensor(7)

In [6]:
scalar.ndim

0

In [7]:
# get tensor back as python int
scalar.item()

7

In [9]:
# Vector: one level of square brackets, so 1 dimension
vector = torch.tensor([7, 7])
vector

tensor([7, 7])

In [10]:
vector.ndim

1

In [11]:
vector.shape

torch.Size([2])

In [12]:
# Matrix: two levels of square brackets, so 2 dimensions
MATRIX = torch.tensor([[7, 8],
                       [9, 10]])
MATRIX

tensor([[ 7,  8],
        [ 9, 10]])

In [13]:
MATRIX.ndim

2

In [14]:
MATRIX[0]

tensor([7, 8])

In [15]:
# Tensor: three levels of square brackets, so 3 dimensions
TENSOR = torch.tensor([[[1, 2, 3],
                        [4, 5, 6],
                        [7, 8, 9]]])

In [16]:
TENSOR

tensor([[[1, 2, 3],
         [4, 5, 6],
         [7, 8, 9]]])

In [17]:
TENSOR.ndim

3

In [18]:
TENSOR.shape

torch.Size([1, 3, 3])

### Random tensors

Random tensors are important because many neural networks learn by starting
with tensors full of random numbers and then adjusting those numbers to better represent the data.
Start with random numbers --> look at the data --> update the numbers --> look at the data --> update the numbers

In [19]:
# Create a random tensor of shape (3, 4)
random_tensor = torch.rand(size=(3, 4))
random_tensor

tensor([[0.1803, 0.3257, 0.9739, 0.6404],
        [0.4163, 0.8624, 0.7314, 0.3623],
        [0.7169, 0.2239, 0.2888, 0.7522]])

In [24]:
# Random tensor with the same shape as a typical image tensor
random_image_size_tensor = torch.rand(3, 224, 224)
print(random_image_size_tensor.dim())

3


In [25]:
random_image_size_tensor.shape

torch.Size([3, 224, 224])

In [26]:
random_image_size_tensor.size()

torch.Size([3, 224, 224])

### Zeros and ones

In [29]:
# Tensor of shape (3, 4) filled with zeros
zeros = torch.zeros(3, 4)
zeros

tensor([[0., 0., 0., 0.],
        [0., 0., 0., 0.],
        [0., 0., 0., 0.]])

In [31]:
# Tensor of shape (3, 4) filled with ones
ones = torch.ones(3, 4)
ones

tensor([[1., 1., 1., 1.],
        [1., 1., 1., 1.],
        [1., 1., 1., 1.]])

In [32]:
ones.dtype

torch.float32

In [33]:
random_image_size_tensor.dtype

torch.float32

#### Creating a range of tensors and tensors-like

In [34]:
# torch.arange(start, end, step): values from 0 up to (but excluding) 1001 in steps of 20.
# Note: despite its name, this tensor starts at 0 and holds every 20th value up to 1000.
one_to_thousand = torch.arange(0, 1001, 20)
one_to_thousand

tensor([   0,   20,   40,   60,   80,  100,  120,  140,  160,  180,  200,  220,
         240,  260,  280,  300,  320,  340,  360,  380,  400,  420,  440,  460,
         480,  500,  520,  540,  560,  580,  600,  620,  640,  660,  680,  700,
         720,  740,  760,  780,  800,  820,  840,  860,  880,  900,  920,  940,
         960,  980, 1000])

In [36]:
# torch.zeros_like builds a tensor of zeros with the same shape as its input.
# Note: despite its name, the result has one zero per element of one_to_thousand
# (51 values in the displayed output), not 1000.
thousand_zeros = torch.zeros_like(input=one_to_thousand)
thousand_zeros

tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
        0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0,
        0, 0, 0])

### Tensor Datatypes
Most common errors when working with tensors:
1. Tensors are not the right datatype
2. Tensors are not the right shape
3. Tensors are not on the right device

In [41]:
# Float32 tensor
float_32_tensor = torch.tensor(
    [3.0, 6.0, 9.0],
    dtype=None,           # datatype of the tensor; None lets PyTorch pick it from the data (float32 here)
    device=None,          # device the tensor lives on; None uses the default device
    requires_grad=False,  # whether or not to track gradients for operations on this tensor
)

In [40]:
float_32_tensor.dtype

torch.float32

In [42]:
# Convert the float32 tensor to half precision (float16); the original tensor is left unchanged
float_16_tensor = float_32_tensor.to(torch.float16)
float_16_tensor

tensor([3., 6., 9.], dtype=torch.float16)

In [43]:
# 32-bit integer tensor. The dtype now matches the variable name (it was
# torch.int64 before). Multiplying it with a float32 tensor still promotes
# the result to float32.
int_32_tensor = torch.tensor([3, 4, 5], dtype=torch.int32)


In [44]:
int_32_tensor * float_32_tensor

tensor([ 9., 24., 45.])

In [45]:
random_tensor.device

device(type='cpu')

### Manipulating tensors (tensor operations)
Tensor operations:
* Addition
* Subtraction
* Multiplication (element wise)
* Division
* Matrix Multiplication

In [46]:
# Create a tensor and add 100 to every element (the original tensor is not modified)
tensor = torch.tensor([1, 2, 3])
tensor + 100

tensor([101, 102, 103])

In [47]:
# Multiply 
tensor * 10

tensor([10, 20, 30])

In [48]:
# Subtract 100 from every element
tensor - 100

tensor([-99, -98, -97])

In [49]:
torch.mul(tensor, 20)

tensor([20, 40, 60])

### Matrix Multiplication

Two ways to multiply tensors:
* element-wise multiplication
* matrix multiplication (dot product)

Matrix multiplication must satisfy two main rules:
1. The **inner dimensions** must match
2. The resulting matrix has the shape of the **outer dimensions**

In [50]:
# Element wise
tensor * tensor

tensor([1, 4, 9])

In [52]:
# Dot product
torch.matmul(tensor, tensor)

tensor(14)

#### Transpose a matrix

To swap the dimensions of a matrix (rows become columns), use the transpose (`.T`).

In [53]:
random_tensor

tensor([[0.1803, 0.3257, 0.9739, 0.6404],
        [0.4163, 0.8624, 0.7314, 0.3623],
        [0.7169, 0.2239, 0.2888, 0.7522]])

In [54]:
random_tensor.T

tensor([[0.1803, 0.4163, 0.7169],
        [0.3257, 0.8624, 0.2239],
        [0.9739, 0.7314, 0.2888],
        [0.6404, 0.3623, 0.7522]])

In [56]:
random_tensor.shape

torch.Size([3, 4])

In [57]:
# Multiplying a (3, 4) matrix by itself fails because the inner dimensions
# (4 and 3) do not match. The error is the point of this cell, so it is caught
# and printed; an uncaught exception would stop "Restart Kernel -> Run All".
try:
    random_tensor @ random_tensor
except RuntimeError as err:
    print(f"RuntimeError: {err}")

RuntimeError: mat1 and mat2 shapes cannot be multiplied (3x4 and 3x4)

In [58]:
random_tensor @ random_tensor.T

tensor([[1.4971, 1.3002, 0.9651],
        [1.3002, 1.5832, 0.9752],
        [0.9651, 0.9752, 1.2132]])

### Finding the min, max, mean, sum etc. (tensor aggregation)

In [59]:
one_to_thousand.min()

tensor(0)

In [60]:
one_to_thousand.max()

tensor(1000)

In [66]:
# Find the mean - torch.mean requires a floating point (or complex) dtype.
# one_to_thousand holds integers (Long), so this call raises. The error is
# caught and printed so the notebook still runs top to bottom; the following
# cells show two ways to fix it.
try:
    one_to_thousand.mean()
except RuntimeError as err:
    print(f"RuntimeError: {err}")

RuntimeError: mean(): could not infer output dtype. Input dtype must be either a floating point or complex dtype. Got: Long

In [67]:
torch.mean(one_to_thousand.type(torch.float32))

tensor(500.)

In [68]:
torch.mean(one_to_thousand, dtype=torch.float32)

tensor(500.)

In [69]:
torch.sum(one_to_thousand)

tensor(25500)

#### Finding the positional max and min 

In [73]:
random_tensor.argmax()

tensor(2)

In [74]:
random_tensor.argmin()

tensor(0)

### Reshaping, stacking, squeezing and unsqueezing tensors
* torch.reshape(input, shape)-->	Reshapes input to shape (if compatible), can also use torch.Tensor.reshape().
* torch.Tensor.view(shape)-->	Returns a view of the original tensor in a different shape but shares the same data as the original tensor.
* torch.stack(tensors, dim=0)-->	Concatenates a sequence of tensors along a new dimension (dim), all tensors must be same size.
* torch.squeeze(input)-->	Squeezes input to remove all the dimensions of size 1.
* torch.unsqueeze(input, dim)-->	Returns input with a dimension value of 1 added at dim.
* torch.permute(input, dims)-->	Returns a view of the original input with its dimensions permuted (rearranged) to dims.

In [76]:
# Float tensor holding 1.0 through 9.0 (the float start value makes the result floating point)
x = torch.arange(start=1.0, end=10)

In [77]:
x

tensor([1., 2., 3., 4., 5., 6., 7., 8., 9.])

In [78]:
x, x.shape

(tensor([1., 2., 3., 4., 5., 6., 7., 8., 9.]), torch.Size([9]))

In [79]:
x_reshaped = x.reshape(1,9)
x_reshaped, x_reshaped.shape

(tensor([[1., 2., 3., 4., 5., 6., 7., 8., 9.]]), torch.Size([1, 9]))

In [80]:
x_reshaped = x.reshape(9,1)
x_reshaped, x_reshaped.shape

(tensor([[1.],
         [2.],
         [3.],
         [4.],
         [5.],
         [6.],
         [7.],
         [8.],
         [9.]]),
 torch.Size([9, 1]))

In [81]:
# changing the view
z = x.view(1,9)
z, z.shape

(tensor([[1., 2., 3., 4., 5., 6., 7., 8., 9.]]), torch.Size([1, 9]))

In [82]:
# Changing z also changes x: a view shares the same memory as the original tensor.
# Here the first column of z (i.e. the first element of x) is overwritten with 5.
z[:, 0] = 5
z

tensor([[5., 2., 3., 4., 5., 6., 7., 8., 9.]])

In [83]:
x

tensor([5., 2., 3., 4., 5., 6., 7., 8., 9.])

In [84]:
# Stack five copies of x along a new dimension at dim=1:
# each copy becomes a column, giving a result of shape (9, 5)
x_stacked = torch.stack([x, x, x, x, x], dim=1)
x_stacked

tensor([[5., 5., 5., 5., 5.],
        [2., 2., 2., 2., 2.],
        [3., 3., 3., 3., 3.],
        [4., 4., 4., 4., 4.],
        [5., 5., 5., 5., 5.],
        [6., 6., 6., 6., 6.],
        [7., 7., 7., 7., 7.],
        [8., 8., 8., 8., 8.],
        [9., 9., 9., 9., 9.]])

In [85]:
# Stack five copies of x along a new dimension at dim=0:
# each copy becomes a row (stacked on top of each other), giving shape (5, 9)
x_stacked = torch.stack([x, x, x, x, x], dim=0)
x_stacked

tensor([[5., 2., 3., 4., 5., 6., 7., 8., 9.],
        [5., 2., 3., 4., 5., 6., 7., 8., 9.],
        [5., 2., 3., 4., 5., 6., 7., 8., 9.],
        [5., 2., 3., 4., 5., 6., 7., 8., 9.],
        [5., 2., 3., 4., 5., 6., 7., 8., 9.]])

In [88]:
# torch.squeeze() - removes all the single dimensions (size 1) from a target tensor
x_reshaped.squeeze().ndim

1

In [89]:
x_reshaped.ndim

2

In [93]:
# torch.unsqueeze adds a dimension of size 1 to a target tensor at the given dim.
# First squeeze x_reshaped down to 1 dimension, then add a new leading dimension.
x_squeezed = x_reshaped.squeeze()
x_squeezed.unsqueeze(dim=0)

tensor([[5., 2., 3., 4., 5., 6., 7., 8., 9.]])

In [94]:
x_squeezed.unsqueeze(dim=1)

tensor([[5.],
        [2.],
        [3.],
        [4.],
        [5.],
        [6.],
        [7.],
        [8.],
        [9.]])

In [96]:
x_squeezed.unsqueeze(dim=-1)


tensor([[5.],
        [2.],
        [3.],
        [4.],
        [5.],
        [6.],
        [7.],
        [8.],
        [9.]])

In [98]:
# torch.permute - rearrange the dimensions of a target tensor in a specified order.
# Old dim 2 moves to the front: (224, 224, 3) -> (3, 224, 224).
x_original = torch.rand(224, 224, 3)
x_permuted = torch.permute(x_original, (2, 0, 1))


In [99]:
print(x_original.shape)
print(x_permuted.shape)

torch.Size([224, 224, 3])
torch.Size([3, 224, 224])


### Indexing 
Similar to NumPy

In [100]:
# Integers 1..9 arranged as a single 3x3 matrix inside an outer dimension: shape (1, 3, 3)
x = torch.reshape(torch.arange(1, 10), (1, 3, 3))
x, x.shape

(tensor([[[1, 2, 3],
          [4, 5, 6],
          [7, 8, 9]]]),
 torch.Size([1, 3, 3]))

In [101]:
x[0][0]

tensor([1, 2, 3])

In [102]:
x[0,0]

tensor([1, 2, 3])

In [103]:
x[0, 0, 1]

tensor(2)

In [108]:
x[:,:, 2]

tensor([[3, 6, 9]])

In [109]:
x[:,1,1]

tensor([5])

In [110]:
x[0,0,:]

tensor([1, 2, 3])

#### Reproducibility 
(trying to take the random out of random)


In [111]:
RANDOM_SEED = 42  # try changing this to different values and see what happens to the numbers below

# Seed the random number generator, then draw the first random tensor
torch.manual_seed(RANDOM_SEED)
random_tensor_C = torch.rand(size=(3, 4))

# Re-seed before the second draw: each rand() call advances the generator,
# so without this line tensor D would be different to tensor C
torch.manual_seed(RANDOM_SEED)  # try commenting this line out and seeing what happens
random_tensor_D = torch.rand(size=(3, 4))

print(f"Tensor C:\n{random_tensor_C}\n")
print(f"Tensor D:\n{random_tensor_D}\n")
print("Does Tensor C equal Tensor D? (anywhere)")
random_tensor_C == random_tensor_D

Tensor C:
tensor([[0.8823, 0.9150, 0.3829, 0.9593],
        [0.3904, 0.6009, 0.2566, 0.7936],
        [0.9408, 0.1332, 0.9346, 0.5936]])

Tensor D:
tensor([[0.8823, 0.9150, 0.3829, 0.9593],
        [0.3904, 0.6009, 0.2566, 0.7936],
        [0.9408, 0.1332, 0.9346, 0.5936]])

Does Tensor C equal Tensor D? (anywhere)


tensor([[True, True, True, True],
        [True, True, True, True],
        [True, True, True, True]])