# AUTOGRAD: AUTOMATIC DIFFERENTIATION
The autograd package provides automatic differentiation for all operations on Tensors.
# Tensor
`torch.Tensor` is the central class of the package. If you set its attribute `.requires_grad` to `True`, it starts to track all operations on it. When you finish your computation, you can call `.backward()` and have all the gradients computed automatically. The gradient for this tensor will be accumulated into its `.grad` attribute.


In [1]:
import torch

# Create a tensor with `requires_grad=True` so that operations on it are tracked
x = torch.ones(2, 2, requires_grad=True)
print(x)

tensor([[1., 1.],
        [1., 1.]], requires_grad=True)


In [2]:
# Apply an operation to x; the result carries a grad_fn recording how it was produced
y = x + 2
print(y)

tensor([[3., 3.],
        [3., 3.]], grad_fn=<AddBackward0>)


In [3]:
# y is the result of an operation, so its grad_fn is set
print(y.grad_fn)

<AddBackward0 object at 0x000001FA9F302408>


In [4]:
# More operations on y: z is elementwise 3 * y^2, and out is the mean of z (a scalar)
z = y * y * 3
out = z.mean()

print(z, out)

tensor([[27., 27.],
        [27., 27.]], grad_fn=<MulBackward0>) tensor(27., grad_fn=<MeanBackward0>)


In [6]:
# `requires_grad` defaults to False when a tensor is created
a = torch.randn(2, 2)
a = ((a * 3) / (a - 1))
print(a.requires_grad)
a.requires_grad_(True)  # change `requires_grad` in place (the trailing `_` marks an in-place method)
print(a.requires_grad)
b = (a * a).sum()
print(b.grad_fn)

False
True
<SumBackward0 object at 0x000001FA9F3BCCC8>


# Gradients

In [9]:
# backward() has not been called on out yet, so x.grad is still None
print(x.grad)  # before backprop

None


In [10]:
# out is a scalar, so backward() can be called without arguments.
# With out = mean(3 * (x + 2)^2) over 4 elements, d(out)/dx = 1.5 * (x + 2) = 4.5 at x = 1.
out.backward()
print(x.grad)  # after backprop

tensor([[4.5000, 4.5000],
        [4.5000, 4.5000]])


In [11]:
# Start a new example: x is a random vector of 3 elements that requires grad
x = torch.randn(3, requires_grad=True)

y = x * 2

In [17]:
# Keep doubling y until its norm reaches at least 1000,
# so y ends up as x multiplied by a power of two
while y.data.norm() < 1000:
    y = y * 2
print(y)

tensor([-214.0495, -737.4357, 1294.8801], grad_fn=<MulBackward0>)


In [20]:
y.backward()  # y is not a scalar here, so backward() without an argument fails
print(x.grad)

RuntimeError: grad can be implicitly created only for scalar outputs

In [21]:
# y is not a scalar here, so torch.autograd cannot compute the full Jacobian
# directly. When only the vector-Jacobian product is needed, pass the vector
# to backward() as its argument:
v = torch.tensor([0.1, 1.0, 0.001], dtype=torch.float)
y.backward(v)
print(x.grad)

tensor([ 204.8000, 2048.0000,    2.0480])


# 截断autograd的方式
- 设置`.requires_grad=False`: tensor.requires_grad_(False)
- 使用`with torch.no_grad():`包裹代码块
- 使用`.detach()`得到与原tensor内容相同但不需要梯度的tensor

In [22]:
# x requires grad, and so does a result computed from it ...
print(x.requires_grad)
print((x ** 2).requires_grad)

# ... unless the computation runs inside a `torch.no_grad()` block
with torch.no_grad():
    print((x ** 2).requires_grad)

True
True
False


In [23]:
# detach() returns a tensor with the same values as x that does not require grad
print(x.requires_grad)
y = x.detach()
print(y.requires_grad)
print(x.eq(y).all())

True
False
tensor(True)


# 关于`torch.autograd.Function`的使用
待续...