In [1]:
import torch

# Scalars

In [2]:
# Zero-dimensional tensors behave like ordinary scalars.
x, y = torch.tensor(3.0), torch.tensor(2.0)
# Show the sum, product, quotient and power side by side.
(x + y, x * y, x / y, x ** y)

(tensor(5.), tensor(6.), tensor(1.5000), tensor(9.))

# Vectors

In [3]:
# A length-3 integer vector holding 0, 1, 2.
x = torch.arange(0, 3)
x

tensor([0, 1, 2])

In [4]:
# Element at index 2, i.e. the third entry (indexing is zero-based).
x[2]

tensor(2)

In [5]:
# Number of entries in the vector.
len(x)

3

In [6]:
# Shape of the vector: a single axis of length 3.
x.shape

torch.Size([3])

# Matrices

In [7]:
# Lay the integers 0..5 out row by row in a 3x2 matrix.
A = torch.arange(6).reshape((3, 2))
A

tensor([[0, 1],
        [2, 3],
        [4, 5]])

In [8]:
# Transpose: rows and columns are swapped, so the 3x2 matrix becomes 2x3.
A.T

tensor([[0, 2, 4],
        [1, 3, 5]])

In [9]:
# A hand-written symmetric matrix: comparing it entry by entry with its
# transpose gives True at every position.
A = torch.tensor([
    [1, 2, 3],
    [2, 0, 4],
    [3, 4, 5],
])
A == A.T

tensor([[True, True, True],
        [True, True, True],
        [True, True, True]])

# Tensors

In [10]:
# A tensor with three axes, shape (2, 3, 4), holding the integers 0..23.
torch.arange(24).reshape(2,3,4)

tensor([[[ 0,  1,  2,  3],
         [ 4,  5,  6,  7],
         [ 8,  9, 10, 11]],

        [[12, 13, 14, 15],
         [16, 17, 18, 19],
         [20, 21, 22, 23]]])

# Basic Properties of Tensor Arithmetic

In [11]:
# B is a copy of A, so A + B doubles every entry of the 2x3 float matrix.
A = torch.arange(6, dtype=torch.float32).reshape((2, 3))
B = A.clone()
(A, A + B)

(tensor([[0., 1., 2.],
         [3., 4., 5.]]),
 tensor([[ 0.,  2.,  4.],
         [ 6.,  8., 10.]]))

In [12]:
A*B # elementwise (Hadamard) product: multiplies matching entries, not a matrix product

tensor([[ 0.,  1.,  4.],
        [ 9., 16., 25.]])

In [13]:
# Adding or multiplying by a Python scalar acts on every element and
# leaves the tensor's shape unchanged.
a = 2
X = torch.arange(24).reshape((2, 3, 4))
(a + X, (a * X).shape)

(tensor([[[ 2,  3,  4,  5],
          [ 6,  7,  8,  9],
          [10, 11, 12, 13]],
 
         [[14, 15, 16, 17],
          [18, 19, 20, 21],
          [22, 23, 24, 25]]]),
 torch.Size([2, 3, 4]))

# Reduction

In [14]:
# Float vector [0., 1., 2.] shown together with the sum of its entries.
x = torch.arange(3, dtype=torch.float32)
(x, x.sum())

(tensor([0., 1., 2.]), tensor(3.))

In [15]:
# Summing with no axis argument reduces over every element, giving a single scalar.
A.shape,A.sum()

(torch.Size([2, 3]), tensor(15.))

In [16]:
A.shape,A.sum(axis=0) # reduce over axis 0 (the rows): one sum per column, shape (3,)

(torch.Size([2, 3]), tensor([3., 5., 7.]))

In [17]:
A.shape,A.sum(axis=1) # reduce over axis 1 (the columns): one sum per row, shape (2,)

(torch.Size([2, 3]), tensor([ 3., 12.]))

In [18]:
# Reducing over both axes at once is the same as summing every element.
A.sum(axis=[0,1])==A.sum()

tensor(True)

In [19]:
# The mean equals the total sum divided by the number of elements.
A.mean(),A.sum()/A.numel()

(tensor(2.5000), tensor(2.5000))

In [20]:
# Per-column mean: the sum over axis 0 divided by the length of axis 0.
A.mean(axis=0),A.sum(axis=0)/A.shape[0]

(tensor([1.5000, 2.5000, 3.5000]), tensor([1.5000, 2.5000, 3.5000]))

# Non-Reduction Sum

In [21]:
# Keep the reduced axis as size 1 so the row sums form a (2, 1) column
# instead of a flat vector.
sum_A = A.sum(axis=1, keepdims=True)
(sum_A, sum_A.shape)

(tensor([[ 3.],
         [12.]]),
 torch.Size([2, 1]))

In [22]:
# Divide each row by its own sum: the (2, 1) shape of sum_A broadcasts
# across the columns, so every row of the result sums to 1.
A/sum_A

tensor([[0.0000, 0.3333, 0.6667],
        [0.2500, 0.3333, 0.4167]])

In [23]:
# Running (cumulative) sum down axis 0; the shape of A is unchanged.
A.cumsum(axis=0)

tensor([[0., 1., 2.],
        [3., 5., 7.]])

# Dot Products

In [24]:
# Dot product of x with an all-ones vector, which is just the sum of x's entries.
y = torch.ones(3, dtype=torch.float32)
(x, y, torch.dot(x, y))

(tensor([0., 1., 2.]), tensor([1., 1., 1.]), tensor(3.))

In [25]:
# The same dot product, computed as an elementwise multiply followed by a sum.
torch.sum(x*y)

tensor(3.)

# Matrix-Vector Products

In [26]:
# Matrix-vector product of the 2x3 matrix A and the length-3 vector x;
# torch.mv and the @ operator return the same length-2 result.
A.shape,x.shape,torch.mv(A,x),A@x

(torch.Size([2, 3]), torch.Size([3]), tensor([ 5., 14.]), tensor([ 5., 14.]))

# Matrix-Matrix Multiplication

In [27]:
# Multiply the 2x3 matrix A by a 3x4 matrix of ones, once with torch.mm
# and once with the @ operator; both give the same 2x4 result.
B = torch.ones((3, 4))
(torch.mm(A, B), A @ B)

(tensor([[ 3.,  3.,  3.,  3.],
         [12., 12., 12., 12.]]),
 tensor([[ 3.,  3.,  3.,  3.],
         [12., 12., 12., 12.]]))

# Norms

In [28]:
# Euclidean (l2) norm: the square root of the sum of squared entries.
# torch.linalg.vector_norm replaces the deprecated torch.norm; its default
# order is 2, so the displayed result is unchanged.
u = torch.tensor([3.0, -4.0])
torch.linalg.vector_norm(u)

tensor(5.)

In [29]:
torch.abs(u).sum() # l1 norm: sum of the absolute values of the entries

tensor(7.)

In [30]:
# Frobenius norm of a 4x9 matrix of ones: sqrt(4 * 9) = 6.
# torch.linalg.matrix_norm (default ord='fro') replaces the deprecated torch.norm.
torch.linalg.matrix_norm(torch.ones((4, 9)))

tensor(6.)

# Exercises

In [31]:
# Two identical 2x2 integer matrices used by the exercise cells that follow.
A = torch.arange(4).reshape((2, 2))
B = torch.arange(4).reshape((2, 2))
(A, B)

(tensor([[0, 1],
         [2, 3]]),
 tensor([[0, 1],
         [2, 3]]))

In [32]:
# Transposing twice gives back the original matrix.
A==A.T.T

tensor([[True, True],
        [True, True]])

In [33]:
# The sum of the transposes equals the transpose of the sum.
A.T+B.T==(A+B).T

tensor([[True, True],
        [True, True]])

In [34]:
A+A.T==(A+A.T).T # A+A.T is always symmetric, i.e. equal to its own transpose

tensor([[True, True],
        [True, True]])

In [35]:
# len() of a tensor is the size of its first axis: X has shape (2, 3, 4), so this is 2.
len(X)

2

In [36]:
# A.sum(axis=1) has shape (2,), so it broadcasts along the last axis:
# column j is divided by the sum of row j. This is NOT a per-row
# normalisation; that needs A.sum(axis=1, keepdims=True). The division
# only runs without a shape error here because A is square.
A/A.sum(axis=1),A.sum(axis=1)

(tensor([[0.0000, 0.2000],
         [2.0000, 0.6000]]),
 tensor([1, 5]))

In [37]:
# Sum the (2, 3, 4) tensor over each axis in turn; the results have
# shapes (3, 4), (2, 4) and (2, 3) respectively.
X.sum(axis=0),X.sum(axis=1),X.sum(axis=2)

(tensor([[12, 14, 16, 18],
         [20, 22, 24, 26],
         [28, 30, 32, 34]]),
 tensor([[12, 15, 18, 21],
         [48, 51, 54, 57]]),
 tensor([[ 6, 22, 38],
         [54, 70, 86]]))