In [2]:
# Shell out to nvidia-smi to show the driver/CUDA versions and the GPU(s) on this machine
!nvidia-smi

Wed Oct 22 17:03:24 2025       
+-----------------------------------------------------------------------------------------+
| NVIDIA-SMI 581.57                 Driver Version: 581.57         CUDA Version: 13.0     |
+-----------------------------------------+------------------------+----------------------+
| GPU  Name                  Driver-Model | Bus-Id          Disp.A | Volatile Uncorr. ECC |
| Fan  Temp   Perf          Pwr:Usage/Cap |           Memory-Usage | GPU-Util  Compute M. |
|                                         |                        |               MIG M. |
|   0  NVIDIA GeForce RTX 3050 ...  WDDM  |   00000000:01:00.0 Off |                  N/A |
| N/A   49C    P3             13W /   30W |       0MiB /   4096MiB |      0%      Default |
|                                         |                        |                  N/A |
+-----------------------------------------+------------------------+----------------------+

+----------------------------------------------

In [3]:
import torch
import pandas as pd 
import numpy as np 
import matplotlib.pyplot as plt 
# Print the installed PyTorch version string so the environment is recorded with the notebook
print(torch.__version__)

2.6.0+cu124


## Introduction to Tensors

### Creating Tensors

In [4]:
# Scalar: a single number wrapped in a tensor
scalar = torch.tensor(data=7)
scalar

tensor(7)

In [5]:
# Number of dimensions (axes) of the scalar tensor
scalar.dim()

0

In [None]:
## Get the single value held by the tensor back as a plain Python int
scalar.item()

7

In [14]:
## Vector: a one-dimensional tensor built from a flat list
vector = torch.tensor(data=[7, 7])
vector

tensor([7, 7])

In [15]:
# Number of dimensions (axes) of the vector
vector.dim()

1

In [16]:
# Length along each axis, reported as a torch.Size
vector.size()

torch.Size([2])

In [17]:
## Matrix: a two-dimensional tensor built from a list of rows
matrix = torch.tensor([
    [7, 8],
    [9, 10],
])
matrix

tensor([[ 7,  8],
        [ 9, 10]])

In [19]:
# Dimension count first, then the shape, one per line
print(matrix.dim(), matrix.size(), sep="\n")

2
torch.Size([2, 2])


In [20]:
# Tensor: three levels of list nesting give a three-dimensional tensor
tensor = torch.tensor([
    [
        [1, 2, 3],
        [3, 6, 9],
        [2, 4, 5],
    ],
])
tensor

tensor([[[1, 2, 3],
         [3, 6, 9],
         [2, 4, 5]]])

In [21]:
# Dimension count first, then the shape, one per line
print(tensor.dim(), tensor.size(), sep="\n")

3
torch.Size([1, 3, 3])


### Random Tensors

Why random tensors?

Random tensors are important because many neural networks learn by starting with tensors full of random numbers and then adjusting those numbers to better represent the data.

`Start with random numbers -> look at data -> update random numbers -> look at data -> update random numbers`

In [29]:
## Random tensor with 3 rows and 4 columns
random_tensor = torch.rand(size=(3, 4))
random_tensor

tensor([[0.0307, 0.3151, 0.8957, 0.5877],
        [0.1686, 0.2410, 0.7083, 0.0096],
        [0.9134, 0.9289, 0.2741, 0.4778]])

In [30]:
# Number of dimensions (axes) of the random tensor
random_tensor.dim()

2

In [35]:
# Rebind random_tensor to a three-dimensional random tensor of shape (2, 3, 4)
random_tensor = torch.rand(size=(2, 3, 4))
random_tensor

tensor([[[0.8752, 0.4234, 0.5757, 0.2753],
         [0.5302, 0.3484, 0.2808, 0.8763],
         [0.1061, 0.2356, 0.8507, 0.7256]],

        [[0.8294, 0.7103, 0.9853, 0.3060],
         [0.2823, 0.6152, 0.4800, 0.1039],
         [0.2506, 0.6467, 0.1709, 0.4256]]])

In [32]:
# Number of dimensions (axes) of the random tensor
random_tensor.dim()

3

In [37]:
## Create a random tensor with a similar shape to an image tensor
# The size is given channels-first: 3 colour channels, then a 224 x 224 height/width grid.
random_image_size_tensor = torch.rand(size=(3, 224, 224))  # colour channels, height, width
random_image_size_tensor.shape, random_image_size_tensor.ndim

(torch.Size([3, 224, 224]), 3)

In [None]:
# All-zeros tensor with 3 rows and 4 columns
zero = torch.zeros(3, 4)
zero

tensor([[0., 0., 0., 0.],
        [0., 0., 0., 0.],
        [0., 0., 0., 0.]])

In [39]:
# Elementwise product: the (3, 4) zeros tensor is broadcast against random_tensor,
# so every entry of the result is zero
torch.mul(zero, random_tensor)

tensor([[[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]],

        [[0., 0., 0., 0.],
         [0., 0., 0., 0.],
         [0., 0., 0., 0.]]])

In [40]:
## All-ones tensor with 3 rows and 4 columns
ones = torch.ones(3, 4)
ones

tensor([[1., 1., 1., 1.],
        [1., 1., 1., 1.],
        [1., 1., 1., 1.]])

## Creating a range of values and tensors like other tensors

In [None]:
# torch.arange(start, end, step): evenly stepped values from start up to, but not including, end
# NOTE(review): despite the name, this holds 0, 80, ..., 960 (13 values), not 1..10
one_to_ten = torch.arange(0, 1000, 80)
one_to_ten

tensor([  0,  80, 160, 240, 320, 400, 480, 560, 640, 720, 800, 880, 960])

In [46]:
# "Like" constructors: build an all-zeros tensor shaped like an existing tensor
ten_zeroes = torch.zeros_like(one_to_ten)
ten_zeroes

tensor([0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0, 0])

## Tensor datatypes

Tensor datatype mismatches are one of the 3 big errors you'll run into with PyTorch & deep learning:

1. Tensors are not the right datatype
2. Tensors are not the right shape
3. Tensors are not on the right device

In [None]:
# Float 32 tensors
float_32_tensor = torch.tensor(
    [3.0, 6.0, 9.0],
    dtype=None,           # element datatype (e.g. float32, float16); None infers it from the data
    device="cpu",         # where the tensor lives: "cpu" or a GPU ("cuda")
    requires_grad=False,  # whether or not to track gradients with this tensor
)
float_32_tensor

tensor([3., 6., 9.])

In [50]:
# Inspect the element datatype of the tensor
float_32_tensor.dtype

torch.float32

In [51]:
# Half-precision (float16) copy of the float32 tensor
float_16_tensor = float_32_tensor.to(dtype=torch.float16)
float_16_tensor

tensor([3., 6., 9.], dtype=torch.float16)

In [53]:
# Multiply a float16 tensor by a float32 tensor and check which dtype the result takes
torch.mul(float_16_tensor, float_32_tensor).dtype

torch.float32