import torch
from torch.autograd import Variable
================================================================================
Figure: Forward propagation and back propagation (2018-06-17 08-12-25.png)
================================================================================
torch.autograd calculates differentiation (gradient) values on your behalf
================================================================================
autograd.Variable type
A Variable is composed of "data", "grad", and "grad_fn"
"data" is the data stored in the torch.autograd.Variable type variable
"grad" is the calculated gradient value
"grad_fn" stores the operation that produced the Variable, which autograd uses when it calculates gradients
================================================================================
Suppose the following computational graph structure
1. input_tensor (you don't need to use requires_grad=True on input data like an input image unless you explicitly need its gradient)
2. layer1: $$$\text{output_from_layer1}=\text{trainable_param_in_layer1}\times \text{input_tensor}+2$$$ where trainable_param_in_layer1 is a trainable Variable with requires_grad=True
3. loss function: $$$\text{loss_value}=\text{output_from_layer1}+100$$$
When input_image is passed through layer1, "grad_fn" of the output holds the operation specified in layer1
================================================================================
Your ultimate goal is to update all trainable parameters in all layers so that they reflect the pattern of your big data.
Updating trainable parameters is a problem that has a direction, like a mathematical vector rather than a scalar.
That direction comes from your need to minimize the loss: the gradient $$$\frac{\partial \text{loss}}{\partial \text{param_layer1}}$$$ tells you which way the loss increases, so you step against it when you use the following gradient descent algorithm
$$$\text{adjusted_new_param_in_layer1} \leftarrow \text{current_param_in_layer1} - \text{learning_rate} \times \frac{\partial \text{loss}}{\partial \text{current_param_in_layer1}}$$$
================================================================================
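# @ A minimal sketch (hypothetical scalar values, not from the original note) of the
# gradient descent update rule written above; grad_of_loss_wrt_param stands in for
# an already-computed d(loss)/d(param)
learning_rate=0.01
current_param_in_layer1=torch.tensor(1.0)
grad_of_loss_wrt_param=torch.tensor(4.0)
adjusted_new_param_in_layer1=current_param_in_layer1-learning_rate*grad_of_loss_wrt_param
print(adjusted_new_param_in_layer1)
# tensor(0.9600)
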
# @ c input_image: torch tensor as input image
input_image=torch.ones(2,2)
print(input_image)
# tensor([[1., 1.],
#         [1., 1.]])
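
# @ A quick hedged check tied to the note above: a plain input tensor does not track
# gradients by default, so no requires_grad=True is needed for input data like input_image
print(input_image.requires_grad)
# False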

# @ c trainable_param_in_layer1: trainable parameter in layer1, which is initialized by 1s
trainable_param_in_layer1=torch.ones(2,2)
print(trainable_param_in_layer1)
# tensor([[1., 1.],
#         [1., 1.]])
================================================================================
@ As the constant tensor input_image goes through all layers, the parameters (torch.autograd.Variables) in all layers need to be defined with requires_grad=True to track gradient values. It means the gradient of the loss wrt each trainable parameter is requested to be calculated
@ Parameters of built-in layers such as CNN and RNN modules are defined with requires_grad=True by default, as the sketch below shows
================================================================================
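# @ A minimal sketch (uses torch.nn, which is not imported elsewhere in this note)
# confirming that parameters of a built-in layer already have requires_grad=True
import torch.nn as nn
conv_layer=nn.Conv2d(in_channels=1,out_channels=1,kernel_size=3)
print(conv_layer.weight.requires_grad)
# True
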
# @ c trainable_param_in_layer1: trainable parameter in layer1 
# with option requires_grad=True
trainable_param_in_layer1=Variable(trainable_param_in_layer1,requires_grad=True)
print(trainable_param_in_layer1)
# tensor([[1., 1.],
#         [1., 1.]], requires_grad=True)

print(trainable_param_in_layer1.data)
# tensor([[1., 1.],
#         [1., 1.]])

print(trainable_param_in_layer1.grad)
# None
# because backward() hasn't been called yet, so no gradient has been computed

print(trainable_param_in_layer1.grad_fn)
# None
# because trainable_param_in_layer1 is a leaf Variable created by you,
# not the result of an operation

# @ Create layer1 by using trainable_param_in_layer1
# layer1: (trainable_param_in_layer1*x)+2

# @ Pass input_image into layer1 and get output_from_layer1
output_from_layer1=(trainable_param_in_layer1*input_image)+2

# @ Create loss function layer
# loss function layer: loss_value=output_from_layer1+100
loss_value=output_from_layer1+100
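
# @ A quick hedged check (assuming the lines above were run as written): the output
# of layer1 records the operation that produced it in grad_fn, as described earlier
print(output_from_layer1.grad_fn)
# AddBackward0
# because the last operation applied in layer1 was the addition of 2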
================================================================================
@ To update the network (in this case, there is only one parameter, trainable_param_in_layer1), you need to calculate $$$\frac{\partial \text{loss_value}}{\partial \text{trainable_param_in_layer1}}$$$
================================================================================
@ In PyTorch, you can do it by using the following code
# Initialize trainable parameter by 1
trainable_param_in_layer1=torch.ones(2,2)

# Note you use requires_grad=True
trainable_param_in_layer1=Variable(trainable_param_in_layer1,requires_grad=True)

output_from_layer1=input_image*trainable_param_in_layer1

final_loss_value=output_from_layer1.sum()

# Do \frac{\partial final_loss_value}{\partial trainable_param_in_layer1}
final_loss_value.backward()
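
# @ A hedged check (assuming the code above was run exactly as written): since
# final_loss_value=sum(input_image*trainable_param_in_layer1), the gradient wrt the
# parameter is just input_image, i.e. a 2x2 tensor of ones
print(trainable_param_in_layer1.grad)
# tensor([[1., 1.],
#         [1., 1.]])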
================================================================================
@ The gradient of "final_loss_value" wrt "trainable_param_in_layer1" is stored in "trainable_param_in_layer1.grad"
@ Note that there are 2 operations in your whole neural network: one operation is in layer1 and the other is in the loss function layer.
You can't directly calculate $$$\dfrac{\partial \text{final_loss_value}}{\partial \text{trainable_param_in_layer1}}$$$ in a single step.
To calculate $$$\dfrac{\partial \text{final_loss_value}}{\partial \text{trainable_param_in_layer1}}$$$, you should use the chain rule.
For example, $$$\dfrac{\partial \text{final_loss_value}}{\partial \text{trainable_param_in_layer1}} = \dfrac{\partial \text{final_loss_value}}{\partial \text{output_from_layer1}} \times \dfrac{\partial \text{output_from_layer1}}{\partial \text{trainable_param_in_layer1}}$$$
================================================================================
@ The contribution of torch.autograd.Variable is that it calculates that gradient $$$\dfrac{\partial \text{final_loss_value}}{\partial \text{trainable_param_in_layer1}}$$$ on your behalf, whereas you would otherwise have to perform the chain of multiplications in the chain rule manually to find one gradient
================================================================================
Practical example1
import torch
from torch.autograd import Variable

a=torch.ones(2,2)
# 1 1
# 1 1

a=Variable(a,requires_grad=True)

# ================================================================================
print(a.data)
# 1 1
# 1 1

print(a.grad)
# None
# Because you didn't perform any operation

print(a.grad_fn)
# None
# Because you didn't perform any operation

# ================================================================================
b=a+2
print(b)
# 3 3
# 3 3

c=b**2
print(c)
# 9 9
# 9 9

out=c.sum()
print(out)
# 36

# ================================================================================
# To update a, you should calculate \frac{\partial out}{\partial a} 
# \frac{\partial out}{\partial a} is stored into a.grad

# torch.autograd directly calculates \frac{\partial out}{\partial a} 
# without you applying the chain rule dout/da=dout/dc*dc/db*db/da by hand
out.backward()

# ================================================================================
print(a.data)
# 1 1
# 1 1

print(a.grad)
# 6 6
# 6 6

print(a.grad_fn)
# None
# Because a is a leaf Variable created by you, not the result of an operation

# ================================================================================
print(b.data)
# 3 3
# 3 3

print(b.grad)
# None
# because b is a non-leaf Variable, so its gradient is not retained after backward()
# (see the retain_grad() sketch below)

print(b.grad_fn)
# AddBackward0
# To calculate dout/da, PyTorch performed AddBackward0 operation
# because b=a+2
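
# @ A hedged side note (fresh tensors, separate from the example above): gradients
# of non-leaf Variables can be kept by calling retain_grad() before backward()
b_retained=Variable(torch.ones(2,2),requires_grad=True)+2
b_retained.retain_grad()
(b_retained**2).sum().backward()
print(b_retained.grad)
# 6 6
# 6 6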

# ================================================================================
print(c.data)
# 9 9
# 9 9

print(c.grad)
# None
# because c is a non-leaf Variable, so its gradient is not retained after backward()

print(c.grad_fn)
# PowBackward0
# To calculate dout/da, PyTorch performed PowBackward0 operation
# because c=b^2

# ================================================================================
print(out.data)
# 36

print(out.grad)
# None
# because out is a non-leaf Variable, so its gradient is not retained after backward()

print(out.grad_fn)
# SumBackward0
# To calculate dout/da, PyTorch performed SumBackward0 operation
# because out=c.sum()
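
# @ A hedged, hand-computed check of the chain rule that autograd applied above:
# out=sum(c), c=b**2, b=a+2, so
# dout/da = dout/dc * dc/db * db/da = 1 * 2*b * 1 = 2*(a+2) = 6 when a=1
manually_computed_grad=2*(a.data+2)
print(manually_computed_grad)
# 6 6
# 6 6
# which matches a.grad printed above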
================================================================================
Practical example2
Suppose the function z
$$$z=3\times x^{2}$$$
$$$\frac{\partial{z}}{\partial{x}} = 3\times 2\times x$$$
When x=1, $$$\frac{\partial{z}}{\partial{x}} = 6$$$
================================================================================
x=torch.ones(3)
x=Variable(x,requires_grad=True)

y=x**2

z=y*3
print(z)
# 3
# 3
# 3

# ================================================================================
grad=torch.Tensor([0.1,1,10])

# Perform \frac{\partial z}{\partial x}
# Since z is not a scalar, backward() needs a gradient tensor with the same shape as z;
# each element of grad weights the corresponding element of \frac{\partial z}{\partial x}
z.backward(grad)

# ================================================================================
print(x.data)
# 1
# 1
# 1

print(x.grad)
# 0.6
# 6.0
# 60.0
# Since \frac{\partial z}{\partial x}=6 at x=1 and you passed grad=torch.Tensor([0.1,1,10]),
# each element of x.grad is 6 multiplied by the corresponding element of grad

print(x.grad_fn)
# None
# because x is a leaf Variable created by you, not the result of an operation
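
# @ A minimal sketch (fresh tensors named x2/z2, not part of the original note) showing
# the same gradient without weighting: passing a tensor of ones as the gradient
# argument gives the plain \frac{\partial z}{\partial x}=6 for every element
x2=Variable(torch.ones(3),requires_grad=True)
z2=3*x2**2
z2.backward(torch.ones(3))
print(x2.grad)
# 6
# 6
# 6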