# Lab 1: Tensor Manipulation

First Author: Seungjae Ryan Lee (seungjaeryanlee at gmail dot com)
Second Author: Ki Hyun Kim (nlp.with.deep.learning at gmail dot com)

<div class="alert alert-warning">
    NOTE: This corresponds to <a href="https://www.youtube.com/watch?v=ZYX0FaqUeN4&t=23s&list=PLlMkM4tgfjnLSOjrEJN31gZATbcj_MpUm&index=25">Lab 8 of Deep Learning Zero to All Season 1 for TensorFlow</a>.
</div>

## Imports

Run `pip install -r requirements.txt` in a terminal to install all required Python packages.

In [None]:
import numpy as np
import torch

## NumPy Review

We hope that you are familiar with `numpy` and basic linear algebra.

### 1D Array with NumPy

In [None]:
# Rank-1 float64 array holding 0.0 through 6.0 (seven elements).
t = np.arange(7, dtype=np.float64)
print(t)

In [None]:
# ndim is the number of axes (the rank); shape is the length along each axis.
print('Rank  of t: ', t.ndim)
print('Shape of t: ', t.shape)

In [None]:
# Indexing is zero-based and negative indices count from the end.
# A slice a:b includes index a and excludes index b; a missing bound means
# "from the start" or "to the end".
print('t[0] t[1] t[-1] = ', t[0], t[1], t[-1]) # Single elements
print('t[2:5] t[4:-1]  = ', t[2:5], t[4:-1])   # Slices with both bounds given
print('t[:2] t[3:]     = ', t[:2], t[3:])      # Slices with one bound omitted

### 2D Array with NumPy

In [None]:
# 4 x 3 float64 array: one inner list per row.
t = np.array(
    [
        [1., 2., 3.],
        [4., 5., 6.],
        [7., 8., 9.],
        [10., 11., 12.],
    ]
)
print(t)

In [None]:
# For the 2-D array, ndim is 2 and shape is (rows, columns).
print('Rank  of t: ', t.ndim)
print('Shape of t: ', t.shape)

## PyTorch is like NumPy (but better)

### 1D Array with PyTorch

In [None]:
# NumPy version of the 1-D array, shown for comparison with the PyTorch
# tensor built in the next cell. A bare name on the last line of a notebook
# cell displays its repr.
t = np.arange(7, dtype=np.float64)
t

In [None]:
# 1-D float32 tensor holding 0.0 through 6.0.
t = torch.tensor([0., 1., 2., 3., 4., 5., 6.], dtype=torch.float32)
print(t)

In [None]:
# Rank, shape, indexing and slicing mirror the NumPy calls used earlier.
print(t.dim())  # rank (number of axes)
print(t.shape)  # shape, as an attribute
print(t.size()) # shape, as a method call
print(t[0], t[1], t[-1])  # Single elements (negative index counts from the end)
print(t[2:5], t[4:-1])    # Slices with both bounds given
print(t[:2], t[3:])       # Slices with one bound omitted

In [None]:
# size() is the method form of the shape attribute.
print(t.size())

### 2D Array with PyTorch

In [None]:
# 4 x 3 float32 tensor: one inner list per row.
t = torch.tensor(
    [
        [1., 2., 3.],
        [4., 5., 6.],
        [7., 8., 9.],
        [10., 11., 12.],
    ],
    dtype=torch.float32,
)
print(t)

In [None]:
# Inspect the 2-D tensor and slice it along its second axis.
print(t.dim())  # rank
print(t.size()) # shape
print(t[:, 1])         # every row, column index 1 -> a 1-D tensor
print(t[:, 1].size())  # one entry per row
print(t[:, :-1])       # every row, all columns except the last

In [None]:
# Two indices (row 0, column 0) select a single element.
print(t[0,0])

### Shape, Rank, Axis

In [None]:
# Each level of bracket nesting is one axis, outermost first:
# 1 block -> 2 matrices -> 3 rows -> 4 columns.
t = torch.tensor(
    [
        [
            [[1, 2, 3, 4], [5, 6, 7, 8], [9, 10, 11, 12]],
            [[13, 14, 15, 16], [17, 18, 19, 20], [21, 22, 23, 24]],
        ]
    ],
    dtype=torch.float32,
)

In [None]:
# A bare name on the last line of a notebook cell displays its repr.
t

In [None]:
# The rank equals the bracket nesting depth of the literal; the shape lists
# the length of each axis from the outermost bracket to the innermost.
print(t.dim())  # rank  = 4
print(t.size()) # shape = (1, 2, 3, 4)

## Frequently Used Operations in PyTorch

### Mul vs. Matmul

In [None]:
# Section banner (blank line first), then the two operands used to compare
# matrix multiplication with element-wise multiplication.
print('', '-------------', 'Mul vs Matmul', '-------------', sep='\n')
m1 = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)  # 2 x 2
m2 = torch.tensor([[1], [2]], dtype=torch.float32)        # 2 x 1
print(m1)
print(m2)

In [None]:
# The inner dimensions (2 and 2) match, so m1.matmul(m2) is defined.
print('Shape of Matrix 1: ', m1.shape) # 2 x 2
print('Shape of Matrix 2: ', m2.shape) # 2 x 1


In [None]:
# Matrix product: (2 x 2) times (2 x 1) gives a 2 x 1 result.
print(m1.matmul(m2)) # 2 x 1


In [None]:

# Same operands as in the matmul example, rebuilt for the element-wise case.
m1 = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)  # 2 x 2
m2 = torch.tensor([[1], [2]], dtype=torch.float32)        # 2 x 1
print(m1)
print(m2)

In [None]:
# `*` and .mul() are element-wise. m2 (2 x 1) is broadcast across the columns
# of m1 first, so each row of m1 is scaled by the matching entry of m2.
print('Shape of Matrix 1: ', m1.shape) # 2 x 2
print('Shape of Matrix 2: ', m2.shape) # 2 x 1
print(m1 * m2) # 2 x 2
print(m1.mul(m2)) # same result as m1 * m2

### Broadcasting

<div class="alert alert-warning">
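    Careless use of broadcasting can lead to code that is hard to debug: tensors with different but compatible shapes are expanded silently instead of raising an error.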
</div>

In [None]:
# Same shape (1 x 2 each): plain element-wise addition, no broadcasting needed
m1 = torch.tensor([[3, 3]], dtype=torch.float32)
m2 = torch.tensor([[2, 2]], dtype=torch.float32)
print(m1 + m2)

In [None]:
# Vector + scalar: the single value is stretched to match the vector
m1 = torch.tensor([[1, 2]], dtype=torch.float32)
m2 = torch.tensor([3], dtype=torch.float32)  # 3 -> [[3, 3]]
print(m1 + m2)

In [None]:
# 1 x 2 vector + 2 x 1 vector: both are broadcast to 2 x 2 before adding
m1 = torch.tensor([[1, 2]], dtype=torch.float32)    # 1 x 2
m2 = torch.tensor([[3], [4]], dtype=torch.float32)  # 2 x 1
print(m1 + m2)

### Mean

In [None]:
# Mean of a 1-D float tensor.
t = torch.tensor([1, 2], dtype=torch.float32)
print(t.mean())

In [None]:
# Can't use mean() on integers: calling it on a Long (int64) tensor raises a
# RuntimeError. Only that error is caught, so any unrelated failure still
# surfaces instead of being printed as if it were the expected message.
t = torch.LongTensor([1, 2])
try:
    print(t.mean())
except RuntimeError as exc:
    # Show the error text instead of aborting the notebook run.
    print(exc)

You can also use `t.mean` on higher-rank tensors to get the mean of all elements, or the mean along a particular dimension.

In [None]:
# 2 x 2 float tensor used for the per-dimension mean examples.
t = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)
print(t)

In [None]:
# The dim argument names the axis that is reduced away.
print(t.mean())        # no dim: mean of all elements
print(t.mean(dim=0))   # reduce over rows -> one mean per column
print(t.mean(dim=1))   # reduce over columns -> one mean per row
print(t.mean(dim=-1))  # -1 is the last axis, which is dim 1 for a 2-D tensor

### Sum

In [None]:
# 2 x 2 float tensor used for the sum examples.
t = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)
print(t)

In [None]:
# sum() takes the same dim argument as mean(): it names the axis reduced away.
print(t.sum())        # no dim: sum of all elements
print(t.sum(dim=0))   # reduce over rows -> one sum per column
print(t.sum(dim=1))   # reduce over columns -> one sum per row
print(t.sum(dim=-1))  # -1 is the last axis, which is dim 1 for a 2-D tensor

### Max and Argmax

In [None]:
# 2 x 2 float tensor used for the max / argmax examples.
t = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)
print(t)

The `max` operator returns one value if it is called without an argument.

In [None]:
# Without a dim argument, max() reduces over every element.
print(t.max()) # Returns one value: max

The `max` operator returns 2 values when called with a dimension specified. The first value is the maximum value, and the second value is the argmax: the index of the element with the maximum value.

In [None]:
# Show the tensor again so the per-dimension results below can be checked by eye.
print(t)

In [None]:
# dim=0 reduces over rows, giving one result per column.
print(t.max(dim=0)) # Returns two values: max and argmax


In [None]:
# Index 0 of the result holds the maximum values; as the last expression of
# the cell, the notebook displays it.
t.max(dim=0)[0]

In [None]:
# The result can be indexed like a pair: [0] is the max values, [1] the
# positions (argmax) of those values along dim 0.
print('Max: ', t.max(dim=0)[0])
print('Argmax: ', t.max(dim=0)[1])

In [None]:
# dim=1 reduces over columns, giving one result per row.
print(t.max(dim=1))
print(t.max(dim=-1))  # -1 is the last axis, which is dim 1 for a 2-D tensor

### View

<div class="alert alert-warning">
    This function is hard to master, but it is very useful!
</div>

In [None]:
# Integers 0..11 laid out as 2 blocks x 2 rows x 3 columns:
#   [[[0, 1, 2], [3, 4, 5]],
#    [[6, 7, 8], [9, 10, 11]]]
t = np.arange(12).reshape(2, 2, 3)
# Convert the integer array to a float32 tensor with the same shape.
ft = torch.tensor(t, dtype=torch.float32)
print(ft.shape)

In [None]:
# -1 tells view() to infer that dimension from the element count:
# 12 elements with a last dimension of 3 gives 4 rows.
print(ft.view([-1, 3]))
print(ft.view([-1, 3]).shape)

In [None]:
# Same 12 elements with a size-1 middle axis: the inferred first dimension is 4.
print(ft.view([-1, 1, 3]))
print(ft.view([-1, 1, 3]).shape)

### Squeeze

In [None]:
# 3 x 1 float tensor: the second axis has length 1.
ft = torch.tensor([[0], [1], [2]], dtype=torch.float32)
print(ft)
print(ft.shape)

In [None]:
# squeeze() drops every axis of length 1, turning the 3 x 1 tensor into a
# 1-D tensor with 3 elements.
print(ft.squeeze())
print(ft.squeeze().shape)

### Unsqueeze

In [None]:
# 1-D float tensor with 3 elements.
ft = torch.tensor([0, 1, 2], dtype=torch.float32)
print(ft.shape)

In [None]:
# unsqueeze(0) inserts a new axis of length 1 at position 0: (3,) -> (1, 3).
print(ft.unsqueeze(0))
print(ft.unsqueeze(0).shape)

In [None]:
# view(1, -1) gives the same (1, 3) result as unsqueeze(0) for this tensor.
print(ft.view(1, -1))
print(ft.view(1, -1).shape)

In [None]:
# unsqueeze(1) inserts the new axis at position 1: (3,) -> (3, 1).
print(ft.unsqueeze(1))
print(ft.unsqueeze(1).shape)

In [None]:
# -1 appends the new axis after the last existing one, which for a 1-D
# tensor is the same as unsqueeze(1): (3,) -> (3, 1).
print(ft.unsqueeze(-1))
print(ft.unsqueeze(-1).shape)

### Scatter (for one-hot encoding)

<div class="alert alert-warning">
    Scatter is a very flexible function. We only discuss how to use it to get a one-hot encoding of indices.
</div>

In [None]:
# Class indices, one per sample, as a 4 x 1 int64 column.
lt = torch.tensor([[0], [1], [2], [0]], dtype=torch.long)
print(lt)

In [None]:
# All-zero 4 x 3 float matrix: one row per sample (batch_size = 4),
# one column per class (classes = 3).
one_hot = torch.zeros((4, 3), dtype=torch.float32)
one_hot

In [None]:
# In-place scatter along dim 1: for each row i, write the value 1 into the
# column given by lt[i][0]. The trailing underscore marks the in-place variant.
one_hot.scatter_(1, lt, 1)
print(one_hot)

### Casting

In [None]:
# 1-D int64 tensor to be cast to float in the next cell.
lt = torch.tensor([1, 2, 3, 4], dtype=torch.long)
print(lt)

In [None]:
# float() returns the tensor cast to float32.
print(lt.float())

In [None]:
# uint8 tensor built from booleans: True is stored as 1 and False as 0.
bt = torch.tensor([True, False, False, True], dtype=torch.uint8)
print(bt)

In [None]:
# Cast the byte tensor to int64 and to float32.
print(bt.long())
print(bt.float())

### Concatenation

In [None]:
# Two 2 x 2 float tensors to concatenate.
x = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)
y = torch.tensor([[5, 6], [7, 8]], dtype=torch.float32)
print(x)
print(y)

In [None]:
# cat joins tensors along an existing axis.
print(torch.cat([x, y], dim=0))  # rows of y below rows of x -> 4 x 2
print(torch.cat([x, y], dim=1))  # columns of y beside columns of x -> 2 x 4

### Stacking

In [None]:
# Three 1-D float tensors of length 2 to stack.
x = torch.tensor([1, 4], dtype=torch.float32)
y = torch.tensor([2, 5], dtype=torch.float32)
z = torch.tensor([3, 6], dtype=torch.float32)

In [None]:
# stack joins tensors along a NEW axis.
print(torch.stack([x, y, z]))         # new axis first (dim=0 by default) -> 3 x 2
print(torch.stack([x, y, z], dim=1))  # new axis second -> 2 x 3

In [None]:
# Same result as torch.stack([x, y, z]): give each vector a leading axis of
# length 1, then concatenate along that axis.
print(torch.cat([x.unsqueeze(0), y.unsqueeze(0), z.unsqueeze(0)], dim=0))

### Ones and Zeros Like

In [None]:
# 2 x 3 float tensor whose shape is reused by ones_like / zeros_like.
x = torch.tensor([[0, 1, 2], [2, 1, 0]], dtype=torch.float32)
print(x)
print(x.size())

In [None]:
# Both calls return a new tensor with the same shape as x, filled with a constant.
print(torch.ones_like(x))   # all ones
print(torch.zeros_like(x))  # all zeros

### In-place Operation

In [None]:
# 2 x 2 float tensor used to contrast mul() with the in-place mul_().
x = torch.tensor([[1, 2], [3, 4]], dtype=torch.float32)

In [None]:
# Methods ending in an underscore modify the tensor in place.
print(x.mul(2.))   # returns a new, doubled tensor
print(x)           # x itself is unchanged
print(x.mul_(2.))  # doubles x in place and returns it
print(x)           # x now holds the doubled values

## Miscellaneous

### Zip

In [None]:
# zip walks several iterables in lockstep, yielding one tuple per position.
for x, y in zip(range(1, 4), range(4, 7)):
    print(x, y)

In [None]:
# zip accepts any number of iterables; here each step yields a 3-tuple.
for x, y, z in zip(range(1, 4), range(4, 7), range(7, 10)):
    print(x, y, z)