# Tensors Tutorial

In [1]:
import torch
import numpy as np

%matplotlib inline

# Tensors 

* Tensors are a specialized data structure that is very similar to arrays and matrices.
* In PyTorch, we use tensors to encode the inputs and outputs of a model, as well as the model’s parameters.
* Tensors are similar to [NumPy’s](https://numpy.org/) ndarrays, except that tensors can run on GPUs or other hardware accelerators. In fact, tensors and NumPy arrays can often share the same underlying memory, eliminating the need to copy data.
* Tensors are also optimized for automatic differentiation.

# Initializing a Tensor

* Tensors can be initialized in various ways. 

## Directly from data

Tensors can be created directly from data. The data type is automatically inferred.

In [2]:
# Build a tensor straight from a nested Python list; the dtype is inferred from the values.
data_list = [[1, 2], [3, 4]]
data_tensor = torch.tensor(data_list)

print(f"Type of data_tensor is {type(data_tensor)}")
print(data_tensor, end="\n\n")  # tensor repr followed by one blank line
print(data_tensor.numpy())      # the same values as a NumPy array

Type of data_tensor is <class 'torch.Tensor'>
tensor([[1, 2],
        [3, 4]])

[[1 2]
 [3 4]]


## From a NumPy array

Tensors can be created from NumPy arrays.

In [3]:
# Turn the nested list into an ndarray first, then hand that array to PyTorch.
data_array = np.array(data_list)
data_tensor = torch.from_numpy(data_array)

print(data_array, end="\n\n")  # array, then a blank separator line
print(data_tensor)

[[1 2]
 [3 4]]

tensor([[1, 2],
        [3, 4]], dtype=torch.int32)


## From another tensor

The new tensor retains the properties (shape, datatype) of the argument tensor, unless explicitly overridden.

In [4]:
# ones_like keeps the properties (shape, datatype) of its argument, here data_tensor.
tensor_ones = torch.ones_like(data_tensor)
print(tensor_ones)

tensor([[1, 1],
        [1, 1]], dtype=torch.int32)


In [5]:
# Same shape as data_tensor, but the datatype is explicitly overridden to float.
tensor_rand = torch.rand_like(
    data_tensor,
    dtype=torch.float,
)
print(tensor_rand)

tensor([[0.7022, 0.1215],
        [0.3356, 0.1004]])


## With random or constant values

``shape`` is a tuple of tensor dimensions. In the functions below, it determines the dimensionality of the output tensor.

In [6]:
# One shape tuple drives all three factory functions below.
shape = (2, 3)
rand_tensor = torch.rand(shape)
ones_tensor = torch.ones(shape)
zeros_tensor = torch.zeros(shape)

# A single print call; the separator supplies the blank line between the sections.
print(
    f"Random Tensor: \n{rand_tensor}",
    f"Ones Tensor: \n{ones_tensor}",
    f"Zeros Tensor: \n{zeros_tensor}",
    sep="\n\n",
)

Random Tensor: 
tensor([[0.0278, 0.0421, 0.4777],
        [0.2340, 0.9918, 0.7121]])

Ones Tensor: 
tensor([[1., 1., 1.],
        [1., 1., 1.]])

Zeros Tensor: 
tensor([[0., 0., 0.],
        [0., 0., 0.]])


# Attributes of a Tensor

* Tensor attributes describe their shape, datatype, and the device on which they are stored.

In [7]:
tensor = torch.rand(3, 4)

# Report the three attributes, one per line.
print(
    f"Shape of tensor: {tensor.shape}",
    f"Datatype of tensor: {tensor.dtype}",
    f"Device tensor is stored on: {tensor.device}",
    sep="\n",
)

Shape of tensor: torch.Size([3, 4])
Datatype of tensor: torch.float32
Device tensor is stored on: cpu


# Operations on Tensors

Over 100 tensor operations, including arithmetic, linear algebra, matrix manipulation (transposing, 
indexing, slicing), sampling and more are comprehensively described [`here`](https://pytorch.org/docs/stable/torch.html).

Each of these operations can be run on the GPU (at typically higher speeds than on a
CPU). By default, tensors are created on the CPU. We need to explicitly move tensors to the GPU using the
``.to`` method (after checking for GPU availability). Copying large tensors across devices can be expensive in terms of time and memory!

In [8]:
# The tensor is relocated only when a CUDA device is present; otherwise it is left where it is.
if not torch.cuda.is_available():
    print("Tensor retained in CPU")
else:
    print("Moving tensor to GPU")
    tensor = tensor.to('cuda')

Tensor retained in CPU


# Standard numpy-like indexing and slicing

In [9]:
tensor = torch.ones((4, 4))

# Read three slices: row 0, column 0, and the last column (selected via Ellipsis).
print('First row: ', tensor[0])
print('First column: ', tensor[:, 0])
print('Last column:', tensor[..., -1])

# Overwrite the second column with zeros, then show the modified tensor.
tensor[:, 1] = 0
print(tensor)

First row:  tensor([1., 1., 1., 1.])
First column:  tensor([1., 1., 1., 1.])
Last column: tensor([1., 1., 1., 1.])
tensor([[1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.]])


# Joining tensors

* We can use ``torch.cat`` to concatenate a sequence of tensors along a given dimension.
See also [`torch.stack`](https://pytorch.org/docs/stable/generated/torch.stack.html),
another tensor joining op that is subtly different from ``torch.cat``.

In [10]:
# Join three copies of ``tensor`` side by side along dimension 1.
pieces = (tensor, tensor, tensor)
t1 = torch.cat(pieces, dim=1)
print(t1)

tensor([[1., 0., 1., 1., 1., 0., 1., 1., 1., 0., 1., 1.],
        [1., 0., 1., 1., 1., 0., 1., 1., 1., 0., 1., 1.],
        [1., 0., 1., 1., 1., 0., 1., 1., 1., 0., 1., 1.],
        [1., 0., 1., 1., 1., 0., 1., 1., 1., 0., 1., 1.]])


# Arithmetic operations



## Matrix multiplication of two tensors

In [11]:
# Three spellings of the same matrix product; y1, y2 and y3 end up with the same value.
y1 = tensor @ tensor.T
print(y1, end="\n\n")

y2 = tensor.matmul(tensor.T)
print(y2, end="\n\n")

# y3 is filled with random values first, so the overwrite through ``out=`` is visible.
y3 = torch.rand_like(tensor)
print(y3, end="\n\n")

torch.matmul(tensor, tensor.T, out=y3)
print(y3, end="\n\n")

tensor([[3., 3., 3., 3.],
        [3., 3., 3., 3.],
        [3., 3., 3., 3.],
        [3., 3., 3., 3.]])

tensor([[3., 3., 3., 3.],
        [3., 3., 3., 3.],
        [3., 3., 3., 3.],
        [3., 3., 3., 3.]])

tensor([[0.4688, 0.7768, 0.5937, 0.5240],
        [0.5187, 0.4903, 0.6823, 0.5828],
        [0.3995, 0.2597, 0.8673, 0.3126],
        [0.8863, 0.8272, 0.2687, 0.4854]])

tensor([[3., 3., 3., 3.],
        [3., 3., 3., 3.],
        [3., 3., 3., 3.],
        [3., 3., 3., 3.]])



## Element-wise multiplication of two tensors

In [12]:
# Three spellings of the element-wise product; z1, z2 and z3 end up with the same value.
z1 = tensor * tensor
z2 = tensor.mul(tensor)

# z3 is pre-allocated with random values and then overwritten through ``out=``.
z3 = torch.rand_like(tensor)
torch.mul(tensor, tensor, out=z3)

# The separator supplies the blank line between the three results.
print(z1, z2, z3, sep="\n\n")

tensor([[1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.]])

tensor([[1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.]])

tensor([[1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.]])


# Single-element tensors

* If we have a one-element tensor, for example by aggregating all values of a tensor into one value, we can convert it to a Python numerical value using ``item()``:

In [13]:
# Sum the whole tensor into a one-element tensor, then unwrap it with item().
print(tensor, end="\n\n")

agg = tensor.sum()
print(agg, end="\n\n")

agg_item = agg.item()
print(agg_item, type(agg_item), end="\n\n")

tensor([[1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.]])

tensor(12.)

12.0 <class 'float'>



# In-place operations

* Operations that store the result into the operand are called in-place. They are denoted by a ``_`` suffix. 
* For example: ``x.copy_(y)``, ``x.t_()``, will change ``x``.

In [14]:
# Show the tensor before the update; the extra "\n" argument leaves a blank line after it.
print(tensor, "\n")
# add_ carries the ``_`` suffix: it stores the result (every element plus 5) back into ``tensor``.
tensor.add_(5)
print(tensor)

tensor([[1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.],
        [1., 0., 1., 1.]]) 

tensor([[6., 5., 6., 6.],
        [6., 5., 6., 6.],
        [6., 5., 6., 6.],
        [6., 5., 6., 6.]])


<b>In-place operations save some memory, but can be problematic when computing derivatives because of an immediate loss of history. Hence, their use is discouraged.</b>


# Bridge with NumPy

* Tensors on the CPU and NumPy arrays can share their underlying memory locations, and changing one will change the other.

## Convert Tensor to NumPy array

In [15]:
# Create a tensor and obtain its NumPy counterpart before printing both.
t = torch.ones(5)
n = t.numpy()

print(f"t: {t}", f"n: {n}", sep="\n")

t: tensor([1., 1., 1., 1., 1.])
n: [1. 1. 1. 1. 1.]


<b>A change in the tensor is reflected in the NumPy array.</b>

In [16]:
# In-place add on the tensor only; ``n`` is printed afterwards without being touched directly.
t.add_(1)
print(f"t: {t}", f"n: {n}", sep="\n")

t: tensor([2., 2., 2., 2., 2.])
n: [2. 2. 2. 2. 2.]


## Convert NumPy array to Tensor

In [20]:
# Start from a NumPy array this time and wrap it as a tensor.
n = np.ones(5)
t = torch.from_numpy(n)

print(f"n: {n}", f"t: {t}", sep="\n")

n: [1. 1. 1. 1. 1.]
t: tensor([1., 1., 1., 1., 1.], dtype=torch.float64)


<b>Changes in the NumPy array are reflected in the tensor.</b>

In [21]:
# Add 1 to the array, writing the result back into ``n`` itself via ``out=``.
np.add(n, 1, out=n)
print(f"t: {t}", f"n: {n}", sep="\n")

t: tensor([2., 2., 2., 2., 2.], dtype=torch.float64)
n: [2. 2. 2. 2. 2.]
