diff --git a/_downloads/1c22195f47cf0e89ae2e0989dd4be6bb/two_layer_net_optim.py b/_downloads/1c22195f47cf0e89ae2e0989dd4be6bb/two_layer_net_optim.py deleted file mode 100644 index 82b67dcc1b0..00000000000 --- a/_downloads/1c22195f47cf0e89ae2e0989dd4be6bb/two_layer_net_optim.py +++ /dev/null @@ -1,62 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: optim --------------- - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation uses the nn package from PyTorch to build the network. - -Rather than manually updating the weights of the model as we have been doing, -we use the optim package to define an Optimizer that will update the weights -for us. The optim package defines many optimization algorithms that are commonly -used for deep learning, including SGD+momentum, RMSProp, Adam, etc. -""" -import torch - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold inputs and outputs -x = torch.randn(N, D_in) -y = torch.randn(N, D_out) - -# Use the nn package to define our model and loss function. -model = torch.nn.Sequential( - torch.nn.Linear(D_in, H), - torch.nn.ReLU(), - torch.nn.Linear(H, D_out), -) -loss_fn = torch.nn.MSELoss(reduction='sum') - -# Use the optim package to define an Optimizer that will update the weights of -# the model for us. Here we will use Adam; the optim package contains many other -# optimization algorithms. The first argument to the Adam constructor tells the -# optimizer which Tensors it should update. -learning_rate = 1e-4 -optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate) -for t in range(500): - # Forward pass: compute predicted y by passing x to the model. - y_pred = model(x) - - # Compute and print loss. - loss = loss_fn(y_pred, y) - if t % 100 == 99: - print(t, loss.item()) - - # Before the backward pass, use the optimizer object to zero all of the - # gradients for the variables it will update (which are the learnable - # weights of the model). This is because by default, gradients are - # accumulated in buffers( i.e, not overwritten) whenever .backward() - # is called. Checkout docs of torch.autograd.backward for more details. - optimizer.zero_grad() - - # Backward pass: compute gradient of the loss with respect to model - # parameters - loss.backward() - - # Calling the step function on an Optimizer makes an update to its - # parameters - optimizer.step() diff --git a/_downloads/22f070e74b4f293045131e7170efe86d/two_layer_net_custom_function.py b/_downloads/22f070e74b4f293045131e7170efe86d/two_layer_net_custom_function.py deleted file mode 100644 index 2d2a0875669..00000000000 --- a/_downloads/22f070e74b4f293045131e7170efe86d/two_layer_net_custom_function.py +++ /dev/null @@ -1,97 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Defining New autograd Functions ----------------------------------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation computes the forward pass using operations on PyTorch -Variables, and uses PyTorch autograd to compute gradients. - -In this implementation we implement our own custom autograd function to perform -the ReLU function. 
-""" -import torch - - -class MyReLU(torch.autograd.Function): - """ - We can implement our own custom autograd Functions by subclassing - torch.autograd.Function and implementing the forward and backward passes - which operate on Tensors. - """ - - @staticmethod - def forward(ctx, input): - """ - In the forward pass we receive a Tensor containing the input and return - a Tensor containing the output. ctx is a context object that can be used - to stash information for backward computation. You can cache arbitrary - objects for use in the backward pass using the ctx.save_for_backward method. - """ - ctx.save_for_backward(input) - return input.clamp(min=0) - - @staticmethod - def backward(ctx, grad_output): - """ - In the backward pass we receive a Tensor containing the gradient of the loss - with respect to the output, and we need to compute the gradient of the loss - with respect to the input. - """ - input, = ctx.saved_tensors - grad_input = grad_output.clone() - grad_input[input < 0] = 0 - return grad_input - - -dtype = torch.float -device = torch.device("cpu") -# device = torch.device("cuda:0") # Uncomment this to run on GPU -# torch.backends.cuda.matmul.allow_tf32 = False # Uncomment this to run on GPU - -# The above line disables TensorFloat32. This a feature that allows -# networks to run at a much faster speed while sacrificing precision. -# Although TensorFloat32 works well on most real models, for our toy model -# in this tutorial, the sacrificed precision causes convergence issue. -# For more information, see: -# https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold input and outputs. -x = torch.randn(N, D_in, device=device, dtype=dtype) -y = torch.randn(N, D_out, device=device, dtype=dtype) - -# Create random Tensors for weights. -w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True) -w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True) - -learning_rate = 1e-6 -for t in range(500): - # To apply our Function, we use Function.apply method. We alias this as 'relu'. - relu = MyReLU.apply - - # Forward pass: compute predicted y using operations; we compute - # ReLU using our custom autograd operation. - y_pred = relu(x.mm(w1)).mm(w2) - - # Compute and print loss - loss = (y_pred - y).pow(2).sum() - if t % 100 == 99: - print(t, loss.item()) - - # Use autograd to compute the backward pass. - loss.backward() - - # Update weights using gradient descent - with torch.no_grad(): - w1 -= learning_rate * w1.grad - w2 -= learning_rate * w2.grad - - # Manually zero the gradients after updating weights - w1.grad.zero_() - w2.grad.zero_() diff --git a/_downloads/39d9c599559353177d1597d787c8e2fd/two_layer_net_nn.py b/_downloads/39d9c599559353177d1597d787c8e2fd/two_layer_net_nn.py deleted file mode 100644 index 0c1925878e8..00000000000 --- a/_downloads/39d9c599559353177d1597d787c8e2fd/two_layer_net_nn.py +++ /dev/null @@ -1,68 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: nn ------------ - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation uses the nn package from PyTorch to build the network. 
-PyTorch autograd makes it easy to define computational graphs and take gradients, -but raw autograd can be a bit too low-level for defining complex neural networks; -this is where the nn package can help. The nn package defines a set of Modules, -which you can think of as a neural network layer that has produces output from -input and may have some trainable weights. -""" -import torch - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold inputs and outputs -x = torch.randn(N, D_in) -y = torch.randn(N, D_out) - -# Use the nn package to define our model as a sequence of layers. nn.Sequential -# is a Module which contains other Modules, and applies them in sequence to -# produce its output. Each Linear Module computes output from input using a -# linear function, and holds internal Tensors for its weight and bias. -model = torch.nn.Sequential( - torch.nn.Linear(D_in, H), - torch.nn.ReLU(), - torch.nn.Linear(H, D_out), -) - -# The nn package also contains definitions of popular loss functions; in this -# case we will use Mean Squared Error (MSE) as our loss function. -loss_fn = torch.nn.MSELoss(reduction='sum') - -learning_rate = 1e-4 -for t in range(500): - # Forward pass: compute predicted y by passing x to the model. Module objects - # override the __call__ operator so you can call them like functions. When - # doing so you pass a Tensor of input data to the Module and it produces - # a Tensor of output data. - y_pred = model(x) - - # Compute and print loss. We pass Tensors containing the predicted and true - # values of y, and the loss function returns a Tensor containing the - # loss. - loss = loss_fn(y_pred, y) - if t % 100 == 99: - print(t, loss.item()) - - # Zero the gradients before running the backward pass. - model.zero_grad() - - # Backward pass: compute gradient of the loss with respect to all the learnable - # parameters of the model. Internally, the parameters of each Module are stored - # in Tensors with requires_grad=True, so this call will compute gradients for - # all learnable parameters in the model. - loss.backward() - - # Update the weights using gradient descent. Each parameter is a Tensor, so - # we can access its gradients like we did before. - with torch.no_grad(): - for param in model.parameters(): - param -= learning_rate * param.grad diff --git a/_downloads/42443af84e4770f8d5353f2c6e48f033/two_layer_net_tensor.py b/_downloads/42443af84e4770f8d5353f2c6e48f033/two_layer_net_tensor.py deleted file mode 100644 index 3eacae42702..00000000000 --- a/_downloads/42443af84e4770f8d5353f2c6e48f033/two_layer_net_tensor.py +++ /dev/null @@ -1,62 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Tensors ----------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation uses PyTorch tensors to manually compute the forward pass, -loss, and backward pass. - -A PyTorch Tensor is basically the same as a numpy array: it does not know -anything about deep learning or computational graphs or gradients, and is just -a generic n-dimensional array to be used for arbitrary numeric computation. - -The biggest difference between a numpy array and a PyTorch Tensor is that -a PyTorch Tensor can run on either CPU or GPU. To run operations on the GPU, -just cast the Tensor to a cuda datatype. 
-""" - -import torch - - -dtype = torch.float -device = torch.device("cpu") -# device = torch.device("cuda:0") # Uncomment this to run on GPU - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random input and output data -x = torch.randn(N, D_in, device=device, dtype=dtype) -y = torch.randn(N, D_out, device=device, dtype=dtype) - -# Randomly initialize weights -w1 = torch.randn(D_in, H, device=device, dtype=dtype) -w2 = torch.randn(H, D_out, device=device, dtype=dtype) - -learning_rate = 1e-6 -for t in range(500): - # Forward pass: compute predicted y - h = x.mm(w1) - h_relu = h.clamp(min=0) - y_pred = h_relu.mm(w2) - - # Compute and print loss - loss = (y_pred - y).pow(2).sum().item() - if t % 100 == 99: - print(t, loss) - - # Backprop to compute gradients of w1 and w2 with respect to loss - grad_y_pred = 2.0 * (y_pred - y) - grad_w2 = h_relu.t().mm(grad_y_pred) - grad_h_relu = grad_y_pred.mm(w2.t()) - grad_h = grad_h_relu.clone() - grad_h[h < 0] = 0 - grad_w1 = x.t().mm(grad_h) - - # Update weights using gradient descent - w1 -= learning_rate * grad_w1 - w2 -= learning_rate * grad_w2 diff --git a/_downloads/445f984d6e8c379cf0aefd16ef44a4da/two_layer_net_numpy.py b/_downloads/445f984d6e8c379cf0aefd16ef44a4da/two_layer_net_numpy.py deleted file mode 100644 index f003d0f002b..00000000000 --- a/_downloads/445f984d6e8c379cf0aefd16ef44a4da/two_layer_net_numpy.py +++ /dev/null @@ -1,51 +0,0 @@ -# -*- coding: utf-8 -*- -""" -Warm-up: numpy --------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x using Euclidean error. - -This implementation uses numpy to manually compute the forward pass, loss, and -backward pass. - -A numpy array is a generic n-dimensional array; it does not know anything about -deep learning or gradients or computational graphs, and is just a way to perform -generic numeric computations. -""" -import numpy as np - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. 
-N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random input and output data -x = np.random.randn(N, D_in) -y = np.random.randn(N, D_out) - -# Randomly initialize weights -w1 = np.random.randn(D_in, H) -w2 = np.random.randn(H, D_out) - -learning_rate = 1e-6 -for t in range(500): - # Forward pass: compute predicted y - h = x.dot(w1) - h_relu = np.maximum(h, 0) - y_pred = h_relu.dot(w2) - - # Compute and print loss - loss = np.square(y_pred - y).sum() - print(t, loss) - - # Backprop to compute gradients of w1 and w2 with respect to loss - grad_y_pred = 2.0 * (y_pred - y) - grad_w2 = h_relu.T.dot(grad_y_pred) - grad_h_relu = grad_y_pred.dot(w2.T) - grad_h = grad_h_relu.copy() - grad_h[h < 0] = 0 - grad_w1 = x.T.dot(grad_h) - - # Update weights - w1 -= learning_rate * grad_w1 - w2 -= learning_rate * grad_w2 diff --git a/_downloads/449b1270b788a2ddf451772f6a4e7470/two_layer_net_tensor.ipynb b/_downloads/449b1270b788a2ddf451772f6a4e7470/two_layer_net_tensor.ipynb deleted file mode 100644 index da6e31bbc62..00000000000 --- a/_downloads/449b1270b788a2ddf451772f6a4e7470/two_layer_net_tensor.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Tensors\n----------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x by minimizing squared Euclidean distance.\n\nThis implementation uses PyTorch tensors to manually compute the forward pass,\nloss, and backward pass.\n\nA PyTorch Tensor is basically the same as a numpy array: it does not know\nanything about deep learning or computational graphs or gradients, and is just\na generic n-dimensional array to be used for arbitrary numeric computation.\n\nThe biggest difference between a numpy array and a PyTorch Tensor is that\na PyTorch Tensor can run on either CPU or GPU. 
To run operations on the GPU,\njust cast the Tensor to a cuda datatype.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n\ndtype = torch.float\ndevice = torch.device(\"cpu\")\n# device = torch.device(\"cuda:0\") # Uncomment this to run on GPU\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random input and output data\nx = torch.randn(N, D_in, device=device, dtype=dtype)\ny = torch.randn(N, D_out, device=device, dtype=dtype)\n\n# Randomly initialize weights\nw1 = torch.randn(D_in, H, device=device, dtype=dtype)\nw2 = torch.randn(H, D_out, device=device, dtype=dtype)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # Forward pass: compute predicted y\n h = x.mm(w1)\n h_relu = h.clamp(min=0)\n y_pred = h_relu.mm(w2)\n\n # Compute and print loss\n loss = (y_pred - y).pow(2).sum().item()\n if t % 100 == 99:\n print(t, loss)\n\n # Backprop to compute gradients of w1 and w2 with respect to loss\n grad_y_pred = 2.0 * (y_pred - y)\n grad_w2 = h_relu.t().mm(grad_y_pred)\n grad_h_relu = grad_y_pred.mm(w2.t())\n grad_h = grad_h_relu.clone()\n grad_h[h < 0] = 0\n grad_w1 = x.t().mm(grad_h)\n\n # Update weights using gradient descent\n w1 -= learning_rate * grad_w1\n w2 -= learning_rate * grad_w2" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/7df1a8d6c18d6c7122649856a1ac16b8/two_layer_net_custom_function.ipynb b/_downloads/7df1a8d6c18d6c7122649856a1ac16b8/two_layer_net_custom_function.ipynb deleted file mode 100644 index b5502d22c59..00000000000 --- a/_downloads/7df1a8d6c18d6c7122649856a1ac16b8/two_layer_net_custom_function.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Defining New autograd Functions\n----------------------------------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x by minimizing squared Euclidean distance.\n\nThis implementation computes the forward pass using operations on PyTorch\nVariables, and uses PyTorch autograd to compute gradients.\n\nIn this implementation we implement our own custom autograd function to perform\nthe ReLU function.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n\nclass MyReLU(torch.autograd.Function):\n \"\"\"\n We can implement our own custom autograd Functions by subclassing\n torch.autograd.Function and implementing the forward and backward passes\n which operate on Tensors.\n \"\"\"\n\n @staticmethod\n def forward(ctx, input):\n \"\"\"\n In the forward pass we receive a Tensor containing the input and return\n a Tensor containing the output. 
ctx is a context object that can be used\n to stash information for backward computation. You can cache arbitrary\n objects for use in the backward pass using the ctx.save_for_backward method.\n \"\"\"\n ctx.save_for_backward(input)\n return input.clamp(min=0)\n\n @staticmethod\n def backward(ctx, grad_output):\n \"\"\"\n In the backward pass we receive a Tensor containing the gradient of the loss\n with respect to the output, and we need to compute the gradient of the loss\n with respect to the input.\n \"\"\"\n input, = ctx.saved_tensors\n grad_input = grad_output.clone()\n grad_input[input < 0] = 0\n return grad_input\n\n\ndtype = torch.float\ndevice = torch.device(\"cpu\")\n# device = torch.device(\"cuda:0\") # Uncomment this to run on GPU\n# torch.backends.cuda.matmul.allow_tf32 = False # Uncomment this to run on GPU\n\n# The above line disables TensorFloat32. This a feature that allows\n# networks to run at a much faster speed while sacrificing precision.\n# Although TensorFloat32 works well on most real models, for our toy model\n# in this tutorial, the sacrificed precision causes convergence issue.\n# For more information, see:\n# https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold input and outputs.\nx = torch.randn(N, D_in, device=device, dtype=dtype)\ny = torch.randn(N, D_out, device=device, dtype=dtype)\n\n# Create random Tensors for weights.\nw1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True)\nw2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # To apply our Function, we use Function.apply method. 
We alias this as 'relu'.\n relu = MyReLU.apply\n\n # Forward pass: compute predicted y using operations; we compute\n # ReLU using our custom autograd operation.\n y_pred = relu(x.mm(w1)).mm(w2)\n\n # Compute and print loss\n loss = (y_pred - y).pow(2).sum()\n if t % 100 == 99:\n print(t, loss.item())\n\n # Use autograd to compute the backward pass.\n loss.backward()\n\n # Update weights using gradient descent\n with torch.no_grad():\n w1 -= learning_rate * w1.grad\n w2 -= learning_rate * w2.grad\n\n # Manually zero the gradients after updating weights\n w1.grad.zero_()\n w2.grad.zero_()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/7f1a8a2cb5a62c19268b29c5a0d7a859/two_layer_net_nn.ipynb b/_downloads/7f1a8a2cb5a62c19268b29c5a0d7a859/two_layer_net_nn.ipynb deleted file mode 100644 index 6abfc0f9ddd..00000000000 --- a/_downloads/7f1a8a2cb5a62c19268b29c5a0d7a859/two_layer_net_nn.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: nn\n-----------\n\nA fully-connected ReLU network with one hidden layer, trained to predict y from x\nby minimizing squared Euclidean distance.\n\nThis implementation uses the nn package from PyTorch to build the network.\nPyTorch autograd makes it easy to define computational graphs and take gradients,\nbut raw autograd can be a bit too low-level for defining complex neural networks;\nthis is where the nn package can help. The nn package defines a set of Modules,\nwhich you can think of as a neural network layer that has produces output from\ninput and may have some trainable weights.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold inputs and outputs\nx = torch.randn(N, D_in)\ny = torch.randn(N, D_out)\n\n# Use the nn package to define our model as a sequence of layers. nn.Sequential\n# is a Module which contains other Modules, and applies them in sequence to\n# produce its output. Each Linear Module computes output from input using a\n# linear function, and holds internal Tensors for its weight and bias.\nmodel = torch.nn.Sequential(\n torch.nn.Linear(D_in, H),\n torch.nn.ReLU(),\n torch.nn.Linear(H, D_out),\n)\n\n# The nn package also contains definitions of popular loss functions; in this\n# case we will use Mean Squared Error (MSE) as our loss function.\nloss_fn = torch.nn.MSELoss(reduction='sum')\n\nlearning_rate = 1e-4\nfor t in range(500):\n # Forward pass: compute predicted y by passing x to the model. Module objects\n # override the __call__ operator so you can call them like functions. 
When\n # doing so you pass a Tensor of input data to the Module and it produces\n # a Tensor of output data.\n y_pred = model(x)\n\n # Compute and print loss. We pass Tensors containing the predicted and true\n # values of y, and the loss function returns a Tensor containing the\n # loss.\n loss = loss_fn(y_pred, y)\n if t % 100 == 99:\n print(t, loss.item())\n\n # Zero the gradients before running the backward pass.\n model.zero_grad()\n\n # Backward pass: compute gradient of the loss with respect to all the learnable\n # parameters of the model. Internally, the parameters of each Module are stored\n # in Tensors with requires_grad=True, so this call will compute gradients for\n # all learnable parameters in the model.\n loss.backward()\n\n # Update the weights using gradient descent. Each parameter is a Tensor, so\n # we can access its gradients like we did before.\n with torch.no_grad():\n for param in model.parameters():\n param -= learning_rate * param.grad" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/843ace305951b2a897f80a52e1189938/two_layer_net_module.ipynb b/_downloads/843ace305951b2a897f80a52e1189938/two_layer_net_module.ipynb deleted file mode 100644 index 995ff4b376d..00000000000 --- a/_downloads/843ace305951b2a897f80a52e1189938/two_layer_net_module.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Custom nn Modules\n--------------------------\n\nA fully-connected ReLU network with one hidden layer, trained to predict y from x\nby minimizing squared Euclidean distance.\n\nThis implementation defines the model as a custom Module subclass. Whenever you\nwant a model more complex than a simple sequence of existing Modules you will\nneed to define your model this way.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n\nclass TwoLayerNet(torch.nn.Module):\n def __init__(self, D_in, H, D_out):\n \"\"\"\n In the constructor we instantiate two nn.Linear modules and assign them as\n member variables.\n \"\"\"\n super(TwoLayerNet, self).__init__()\n self.linear1 = torch.nn.Linear(D_in, H)\n self.linear2 = torch.nn.Linear(H, D_out)\n\n def forward(self, x):\n \"\"\"\n In the forward function we accept a Tensor of input data and we must return\n a Tensor of output data. 
We can use Modules defined in the constructor as\n well as arbitrary operators on Tensors.\n \"\"\"\n h_relu = self.linear1(x).clamp(min=0)\n y_pred = self.linear2(h_relu)\n return y_pred\n\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold inputs and outputs\nx = torch.randn(N, D_in)\ny = torch.randn(N, D_out)\n\n# Construct our model by instantiating the class defined above\nmodel = TwoLayerNet(D_in, H, D_out)\n\n# Construct our loss function and an Optimizer. The call to model.parameters()\n# in the SGD constructor will contain the learnable parameters of the two\n# nn.Linear modules which are members of the model.\ncriterion = torch.nn.MSELoss(reduction='sum')\noptimizer = torch.optim.SGD(model.parameters(), lr=1e-4)\nfor t in range(500):\n # Forward pass: Compute predicted y by passing x to the model\n y_pred = model(x)\n\n # Compute and print loss\n loss = criterion(y_pred, y)\n if t % 100 == 99:\n print(t, loss.item())\n\n # Zero gradients, perform a backward pass, and update the weights.\n optimizer.zero_grad()\n loss.backward()\n optimizer.step()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/a48ba4d15c30996aeba51337fb0c8dd7/two_layer_net_optim.ipynb b/_downloads/a48ba4d15c30996aeba51337fb0c8dd7/two_layer_net_optim.ipynb deleted file mode 100644 index 202d7a49812..00000000000 --- a/_downloads/a48ba4d15c30996aeba51337fb0c8dd7/two_layer_net_optim.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: optim\n--------------\n\nA fully-connected ReLU network with one hidden layer, trained to predict y from x\nby minimizing squared Euclidean distance.\n\nThis implementation uses the nn package from PyTorch to build the network.\n\nRather than manually updating the weights of the model as we have been doing,\nwe use the optim package to define an Optimizer that will update the weights\nfor us. The optim package defines many optimization algorithms that are commonly\nused for deep learning, including SGD+momentum, RMSProp, Adam, etc.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold inputs and outputs\nx = torch.randn(N, D_in)\ny = torch.randn(N, D_out)\n\n# Use the nn package to define our model and loss function.\nmodel = torch.nn.Sequential(\n torch.nn.Linear(D_in, H),\n torch.nn.ReLU(),\n torch.nn.Linear(H, D_out),\n)\nloss_fn = torch.nn.MSELoss(reduction='sum')\n\n# Use the optim package to define an Optimizer that will update the weights of\n# the model for us. 
Here we will use Adam; the optim package contains many other\n# optimization algorithms. The first argument to the Adam constructor tells the\n# optimizer which Tensors it should update.\nlearning_rate = 1e-4\noptimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\nfor t in range(500):\n # Forward pass: compute predicted y by passing x to the model.\n y_pred = model(x)\n\n # Compute and print loss.\n loss = loss_fn(y_pred, y)\n if t % 100 == 99:\n print(t, loss.item())\n\n # Before the backward pass, use the optimizer object to zero all of the\n # gradients for the variables it will update (which are the learnable\n # weights of the model). This is because by default, gradients are\n # accumulated in buffers( i.e, not overwritten) whenever .backward()\n # is called. Checkout docs of torch.autograd.backward for more details.\n optimizer.zero_grad()\n\n # Backward pass: compute gradient of the loss with respect to model\n # parameters\n loss.backward()\n\n # Calling the step function on an Optimizer makes an update to its\n # parameters\n optimizer.step()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/b8ed57e2c40a637d92a891b4cf7e72f6/two_layer_net_autograd.ipynb b/_downloads/b8ed57e2c40a637d92a891b4cf7e72f6/two_layer_net_autograd.ipynb deleted file mode 100644 index 54cef9b61fa..00000000000 --- a/_downloads/b8ed57e2c40a637d92a891b4cf7e72f6/two_layer_net_autograd.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Tensors and autograd\n-------------------------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x by minimizing squared Euclidean distance.\n\nThis implementation computes the forward pass using operations on PyTorch\nTensors, and uses PyTorch autograd to compute gradients.\n\n\nA PyTorch Tensor represents a node in a computational graph. If ``x`` is a\nTensor that has ``x.requires_grad=True`` then ``x.grad`` is another Tensor\nholding the gradient of ``x`` with respect to some scalar value.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\ndtype = torch.float\ndevice = torch.device(\"cpu\")\n# device = torch.device(\"cuda:0\") # Uncomment this to run on GPU\n# torch.backends.cuda.matmul.allow_tf32 = False # Uncomment this to run on GPU\n\n# The above line disables TensorFloat32. 
This a feature that allows\n# networks to run at a much faster speed while sacrificing precision.\n# Although TensorFloat32 works well on most real models, for our toy model\n# in this tutorial, the sacrificed precision causes convergence issue.\n# For more information, see:\n# https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold input and outputs.\n# Setting requires_grad=False indicates that we do not need to compute gradients\n# with respect to these Tensors during the backward pass.\nx = torch.randn(N, D_in, device=device, dtype=dtype)\ny = torch.randn(N, D_out, device=device, dtype=dtype)\n\n# Create random Tensors for weights.\n# Setting requires_grad=True indicates that we want to compute gradients with\n# respect to these Tensors during the backward pass.\nw1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True)\nw2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # Forward pass: compute predicted y using operations on Tensors; these\n # are exactly the same operations we used to compute the forward pass using\n # Tensors, but we do not need to keep references to intermediate values since\n # we are not implementing the backward pass by hand.\n y_pred = x.mm(w1).clamp(min=0).mm(w2)\n\n # Compute and print loss using operations on Tensors.\n # Now loss is a Tensor of shape (1,)\n # loss.item() gets the scalar value held in the loss.\n loss = (y_pred - y).pow(2).sum()\n if t % 100 == 99:\n print(t, loss.item())\n\n # Use autograd to compute the backward pass. This call will compute the\n # gradient of loss with respect to all Tensors with requires_grad=True.\n # After this call w1.grad and w2.grad will be Tensors holding the gradient\n # of the loss with respect to w1 and w2 respectively.\n loss.backward()\n\n # Manually update weights using gradient descent. 
Wrap in torch.no_grad()\n # because weights have requires_grad=True, but we don't need to track this\n # in autograd.\n # An alternative way is to operate on weight.data and weight.grad.data.\n # Recall that tensor.data gives a tensor that shares the storage with\n # tensor, but doesn't track history.\n # You can also use torch.optim.SGD to achieve this.\n with torch.no_grad():\n w1 -= learning_rate * w1.grad\n w2 -= learning_rate * w2.grad\n\n # Manually zero the gradients after updating weights\n w1.grad.zero_()\n w2.grad.zero_()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/e11b7a716744fc603445217d61ec787f/two_layer_net_autograd.py b/_downloads/e11b7a716744fc603445217d61ec787f/two_layer_net_autograd.py deleted file mode 100644 index ebbc98b2bb8..00000000000 --- a/_downloads/e11b7a716744fc603445217d61ec787f/two_layer_net_autograd.py +++ /dev/null @@ -1,81 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Tensors and autograd -------------------------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation computes the forward pass using operations on PyTorch -Tensors, and uses PyTorch autograd to compute gradients. - - -A PyTorch Tensor represents a node in a computational graph. If ``x`` is a -Tensor that has ``x.requires_grad=True`` then ``x.grad`` is another Tensor -holding the gradient of ``x`` with respect to some scalar value. -""" -import torch - -dtype = torch.float -device = torch.device("cpu") -# device = torch.device("cuda:0") # Uncomment this to run on GPU -# torch.backends.cuda.matmul.allow_tf32 = False # Uncomment this to run on GPU - -# The above line disables TensorFloat32. This a feature that allows -# networks to run at a much faster speed while sacrificing precision. -# Although TensorFloat32 works well on most real models, for our toy model -# in this tutorial, the sacrificed precision causes convergence issue. -# For more information, see: -# https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold input and outputs. -# Setting requires_grad=False indicates that we do not need to compute gradients -# with respect to these Tensors during the backward pass. -x = torch.randn(N, D_in, device=device, dtype=dtype) -y = torch.randn(N, D_out, device=device, dtype=dtype) - -# Create random Tensors for weights. -# Setting requires_grad=True indicates that we want to compute gradients with -# respect to these Tensors during the backward pass. 
-w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True) -w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True) - -learning_rate = 1e-6 -for t in range(500): - # Forward pass: compute predicted y using operations on Tensors; these - # are exactly the same operations we used to compute the forward pass using - # Tensors, but we do not need to keep references to intermediate values since - # we are not implementing the backward pass by hand. - y_pred = x.mm(w1).clamp(min=0).mm(w2) - - # Compute and print loss using operations on Tensors. - # Now loss is a Tensor of shape (1,) - # loss.item() gets the scalar value held in the loss. - loss = (y_pred - y).pow(2).sum() - if t % 100 == 99: - print(t, loss.item()) - - # Use autograd to compute the backward pass. This call will compute the - # gradient of loss with respect to all Tensors with requires_grad=True. - # After this call w1.grad and w2.grad will be Tensors holding the gradient - # of the loss with respect to w1 and w2 respectively. - loss.backward() - - # Manually update weights using gradient descent. Wrap in torch.no_grad() - # because weights have requires_grad=True, but we don't need to track this - # in autograd. - # An alternative way is to operate on weight.data and weight.grad.data. - # Recall that tensor.data gives a tensor that shares the storage with - # tensor, but doesn't track history. - # You can also use torch.optim.SGD to achieve this. - with torch.no_grad(): - w1 -= learning_rate * w1.grad - w2 -= learning_rate * w2.grad - - # Manually zero the gradients after updating weights - w1.grad.zero_() - w2.grad.zero_() diff --git a/_downloads/f00a2a1e490ec62f7c1bcb950318b7f7/two_layer_net_numpy.ipynb b/_downloads/f00a2a1e490ec62f7c1bcb950318b7f7/two_layer_net_numpy.ipynb deleted file mode 100644 index 24d97015502..00000000000 --- a/_downloads/f00a2a1e490ec62f7c1bcb950318b7f7/two_layer_net_numpy.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nWarm-up: numpy\n--------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x using Euclidean error.\n\nThis implementation uses numpy to manually compute the forward pass, loss, and\nbackward pass.\n\nA numpy array is a generic n-dimensional array; it does not know anything about\ndeep learning or gradients or computational graphs, and is just a way to perform\ngeneric numeric computations.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import numpy as np\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random input and output data\nx = np.random.randn(N, D_in)\ny = np.random.randn(N, D_out)\n\n# Randomly initialize weights\nw1 = np.random.randn(D_in, H)\nw2 = np.random.randn(H, D_out)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # Forward pass: compute predicted y\n h = x.dot(w1)\n h_relu = np.maximum(h, 0)\n y_pred = h_relu.dot(w2)\n\n # Compute and print loss\n loss = np.square(y_pred - y).sum()\n print(t, loss)\n\n # Backprop to compute gradients of w1 and w2 with respect to loss\n grad_y_pred = 2.0 * (y_pred - y)\n grad_w2 = h_relu.T.dot(grad_y_pred)\n grad_h_relu = 
grad_y_pred.dot(w2.T)\n grad_h = grad_h_relu.copy()\n grad_h[h < 0] = 0\n grad_w1 = x.T.dot(grad_h)\n\n # Update weights\n w1 -= learning_rate * grad_w1\n w2 -= learning_rate * grad_w2" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.8" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/fa9717a4ee4117e114380fe627b1350c/two_layer_net_module.py b/_downloads/fa9717a4ee4117e114380fe627b1350c/two_layer_net_module.py deleted file mode 100644 index 29d27274d25..00000000000 --- a/_downloads/fa9717a4ee4117e114380fe627b1350c/two_layer_net_module.py +++ /dev/null @@ -1,65 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Custom nn Modules --------------------------- - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation defines the model as a custom Module subclass. Whenever you -want a model more complex than a simple sequence of existing Modules you will -need to define your model this way. -""" -import torch - - -class TwoLayerNet(torch.nn.Module): - def __init__(self, D_in, H, D_out): - """ - In the constructor we instantiate two nn.Linear modules and assign them as - member variables. - """ - super(TwoLayerNet, self).__init__() - self.linear1 = torch.nn.Linear(D_in, H) - self.linear2 = torch.nn.Linear(H, D_out) - - def forward(self, x): - """ - In the forward function we accept a Tensor of input data and we must return - a Tensor of output data. We can use Modules defined in the constructor as - well as arbitrary operators on Tensors. - """ - h_relu = self.linear1(x).clamp(min=0) - y_pred = self.linear2(h_relu) - return y_pred - - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold inputs and outputs -x = torch.randn(N, D_in) -y = torch.randn(N, D_out) - -# Construct our model by instantiating the class defined above -model = TwoLayerNet(D_in, H, D_out) - -# Construct our loss function and an Optimizer. The call to model.parameters() -# in the SGD constructor will contain the learnable parameters of the two -# nn.Linear modules which are members of the model. -criterion = torch.nn.MSELoss(reduction='sum') -optimizer = torch.optim.SGD(model.parameters(), lr=1e-4) -for t in range(500): - # Forward pass: Compute predicted y by passing x to the model - y_pred = model(x) - - # Compute and print loss - loss = criterion(y_pred, y) - if t % 100 == 99: - print(t, loss.item()) - - # Zero gradients, perform a backward pass, and update the weights. 
- optimizer.zero_grad() - loss.backward() - optimizer.step() diff --git a/_downloads/two_layer_net_autograd.ipynb b/_downloads/two_layer_net_autograd.ipynb deleted file mode 100644 index a776bf7f45b..00000000000 --- a/_downloads/two_layer_net_autograd.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Tensors and autograd\n-------------------------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x by minimizing squared Euclidean distance.\n\nThis implementation computes the forward pass using operations on PyTorch\nTensors, and uses PyTorch autograd to compute gradients.\n\n\nA PyTorch Tensor represents a node in a computational graph. If ``x`` is a\nTensor that has ``x.requires_grad=True`` then ``x.grad`` is another Tensor\nholding the gradient of ``x`` with respect to some scalar value.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\ndtype = torch.float\ndevice = torch.device(\"cpu\")\n# device = torch.device(\"cuda:0\") # Uncomment this to run on GPU\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold input and outputs.\n# Setting requires_grad=False indicates that we do not need to compute gradients\n# with respect to these Tensors during the backward pass.\nx = torch.randn(N, D_in, device=device, dtype=dtype)\ny = torch.randn(N, D_out, device=device, dtype=dtype)\n\n# Create random Tensors for weights.\n# Setting requires_grad=True indicates that we want to compute gradients with\n# respect to these Tensors during the backward pass.\nw1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True)\nw2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # Forward pass: compute predicted y using operations on Tensors; these\n # are exactly the same operations we used to compute the forward pass using\n # Tensors, but we do not need to keep references to intermediate values since\n # we are not implementing the backward pass by hand.\n y_pred = x.mm(w1).clamp(min=0).mm(w2)\n\n # Compute and print loss using operations on Tensors.\n # Now loss is a Tensor of shape (1,)\n # loss.item() gets the a scalar value held in the loss.\n loss = (y_pred - y).pow(2).sum()\n print(t, loss.item())\n\n # Use autograd to compute the backward pass. This call will compute the\n # gradient of loss with respect to all Tensors with requires_grad=True.\n # After this call w1.grad and w2.grad will be Tensors holding the gradient\n # of the loss with respect to w1 and w2 respectively.\n loss.backward()\n\n # Manually update weights using gradient descent. 
Wrap in torch.no_grad()\n # because weights have requires_grad=True, but we don't need to track this\n # in autograd.\n # An alternative way is to operate on weight.data and weight.grad.data.\n # Recall that tensor.data gives a tensor that shares the storage with\n # tensor, but doesn't track history.\n # You can also use torch.optim.SGD to achieve this.\n with torch.no_grad():\n w1 -= learning_rate * w1.grad\n w2 -= learning_rate * w2.grad\n\n # Manually zero the gradients after updating weights\n w1.grad.zero_()\n w2.grad.zero_()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_autograd.py b/_downloads/two_layer_net_autograd.py deleted file mode 100644 index beab57a9afb..00000000000 --- a/_downloads/two_layer_net_autograd.py +++ /dev/null @@ -1,72 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Tensors and autograd -------------------------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation computes the forward pass using operations on PyTorch -Tensors, and uses PyTorch autograd to compute gradients. - - -A PyTorch Tensor represents a node in a computational graph. If ``x`` is a -Tensor that has ``x.requires_grad=True`` then ``x.grad`` is another Tensor -holding the gradient of ``x`` with respect to some scalar value. -""" -import torch - -dtype = torch.float -device = torch.device("cpu") -# device = torch.device("cuda:0") # Uncomment this to run on GPU - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold input and outputs. -# Setting requires_grad=False indicates that we do not need to compute gradients -# with respect to these Tensors during the backward pass. -x = torch.randn(N, D_in, device=device, dtype=dtype) -y = torch.randn(N, D_out, device=device, dtype=dtype) - -# Create random Tensors for weights. -# Setting requires_grad=True indicates that we want to compute gradients with -# respect to these Tensors during the backward pass. -w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True) -w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True) - -learning_rate = 1e-6 -for t in range(500): - # Forward pass: compute predicted y using operations on Tensors; these - # are exactly the same operations we used to compute the forward pass using - # Tensors, but we do not need to keep references to intermediate values since - # we are not implementing the backward pass by hand. - y_pred = x.mm(w1).clamp(min=0).mm(w2) - - # Compute and print loss using operations on Tensors. - # Now loss is a Tensor of shape (1,) - # loss.item() gets the a scalar value held in the loss. - loss = (y_pred - y).pow(2).sum() - print(t, loss.item()) - - # Use autograd to compute the backward pass. This call will compute the - # gradient of loss with respect to all Tensors with requires_grad=True. 
- # After this call w1.grad and w2.grad will be Tensors holding the gradient - # of the loss with respect to w1 and w2 respectively. - loss.backward() - - # Manually update weights using gradient descent. Wrap in torch.no_grad() - # because weights have requires_grad=True, but we don't need to track this - # in autograd. - # An alternative way is to operate on weight.data and weight.grad.data. - # Recall that tensor.data gives a tensor that shares the storage with - # tensor, but doesn't track history. - # You can also use torch.optim.SGD to achieve this. - with torch.no_grad(): - w1 -= learning_rate * w1.grad - w2 -= learning_rate * w2.grad - - # Manually zero the gradients after updating weights - w1.grad.zero_() - w2.grad.zero_() diff --git a/_downloads/two_layer_net_custom_function.ipynb b/_downloads/two_layer_net_custom_function.ipynb deleted file mode 100644 index 01e761ba7de..00000000000 --- a/_downloads/two_layer_net_custom_function.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Defining New autograd Functions\n----------------------------------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x by minimizing squared Euclidean distance.\n\nThis implementation computes the forward pass using operations on PyTorch\nVariables, and uses PyTorch autograd to compute gradients.\n\nIn this implementation we implement our own custom autograd function to perform\nthe ReLU function.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n\nclass MyReLU(torch.autograd.Function):\n \"\"\"\n We can implement our own custom autograd Functions by subclassing\n torch.autograd.Function and implementing the forward and backward passes\n which operate on Tensors.\n \"\"\"\n\n @staticmethod\n def forward(ctx, input):\n \"\"\"\n In the forward pass we receive a Tensor containing the input and return\n a Tensor containing the output. ctx is a context object that can be used\n to stash information for backward computation. 
You can cache arbitrary\n objects for use in the backward pass using the ctx.save_for_backward method.\n \"\"\"\n ctx.save_for_backward(input)\n return input.clamp(min=0)\n\n @staticmethod\n def backward(ctx, grad_output):\n \"\"\"\n In the backward pass we receive a Tensor containing the gradient of the loss\n with respect to the output, and we need to compute the gradient of the loss\n with respect to the input.\n \"\"\"\n input, = ctx.saved_tensors\n grad_input = grad_output.clone()\n grad_input[input < 0] = 0\n return grad_input\n\n\ndtype = torch.float\ndevice = torch.device(\"cpu\")\n# device = torch.device(\"cuda:0\") # Uncomment this to run on GPU\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold input and outputs.\nx = torch.randn(N, D_in, device=device, dtype=dtype)\ny = torch.randn(N, D_out, device=device, dtype=dtype)\n\n# Create random Tensors for weights.\nw1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True)\nw2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # To apply our Function, we use Function.apply method. We alias this as 'relu'.\n relu = MyReLU.apply\n\n # Forward pass: compute predicted y using operations; we compute\n # ReLU using our custom autograd operation.\n y_pred = relu(x.mm(w1)).mm(w2)\n\n # Compute and print loss\n loss = (y_pred - y).pow(2).sum()\n print(t, loss.item())\n\n # Use autograd to compute the backward pass.\n loss.backward()\n\n # Update weights using gradient descent\n with torch.no_grad():\n w1 -= learning_rate * w1.grad\n w2 -= learning_rate * w2.grad\n\n # Manually zero the gradients after updating weights\n w1.grad.zero_()\n w2.grad.zero_()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_custom_function.py b/_downloads/two_layer_net_custom_function.py deleted file mode 100644 index fc4452c53a0..00000000000 --- a/_downloads/two_layer_net_custom_function.py +++ /dev/null @@ -1,88 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Defining New autograd Functions ----------------------------------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation computes the forward pass using operations on PyTorch -Variables, and uses PyTorch autograd to compute gradients. - -In this implementation we implement our own custom autograd function to perform -the ReLU function. -""" -import torch - - -class MyReLU(torch.autograd.Function): - """ - We can implement our own custom autograd Functions by subclassing - torch.autograd.Function and implementing the forward and backward passes - which operate on Tensors. - """ - - @staticmethod - def forward(ctx, input): - """ - In the forward pass we receive a Tensor containing the input and return - a Tensor containing the output. ctx is a context object that can be used - to stash information for backward computation. 
You can cache arbitrary - objects for use in the backward pass using the ctx.save_for_backward method. - """ - ctx.save_for_backward(input) - return input.clamp(min=0) - - @staticmethod - def backward(ctx, grad_output): - """ - In the backward pass we receive a Tensor containing the gradient of the loss - with respect to the output, and we need to compute the gradient of the loss - with respect to the input. - """ - input, = ctx.saved_tensors - grad_input = grad_output.clone() - grad_input[input < 0] = 0 - return grad_input - - -dtype = torch.float -device = torch.device("cpu") -# device = torch.device("cuda:0") # Uncomment this to run on GPU - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold input and outputs. -x = torch.randn(N, D_in, device=device, dtype=dtype) -y = torch.randn(N, D_out, device=device, dtype=dtype) - -# Create random Tensors for weights. -w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True) -w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True) - -learning_rate = 1e-6 -for t in range(500): - # To apply our Function, we use Function.apply method. We alias this as 'relu'. - relu = MyReLU.apply - - # Forward pass: compute predicted y using operations; we compute - # ReLU using our custom autograd operation. - y_pred = relu(x.mm(w1)).mm(w2) - - # Compute and print loss - loss = (y_pred - y).pow(2).sum() - print(t, loss.item()) - - # Use autograd to compute the backward pass. - loss.backward() - - # Update weights using gradient descent - with torch.no_grad(): - w1 -= learning_rate * w1.grad - w2 -= learning_rate * w2.grad - - # Manually zero the gradients after updating weights - w1.grad.zero_() - w2.grad.zero_() diff --git a/_downloads/two_layer_net_module.ipynb b/_downloads/two_layer_net_module.ipynb deleted file mode 100644 index 4b0d4ac9aff..00000000000 --- a/_downloads/two_layer_net_module.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Custom nn Modules\n--------------------------\n\nA fully-connected ReLU network with one hidden layer, trained to predict y from x\nby minimizing squared Euclidean distance.\n\nThis implementation defines the model as a custom Module subclass. Whenever you\nwant a model more complex than a simple sequence of existing Modules you will\nneed to define your model this way.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n\nclass TwoLayerNet(torch.nn.Module):\n def __init__(self, D_in, H, D_out):\n \"\"\"\n In the constructor we instantiate two nn.Linear modules and assign them as\n member variables.\n \"\"\"\n super(TwoLayerNet, self).__init__()\n self.linear1 = torch.nn.Linear(D_in, H)\n self.linear2 = torch.nn.Linear(H, D_out)\n\n def forward(self, x):\n \"\"\"\n In the forward function we accept a Tensor of input data and we must return\n a Tensor of output data. 
We can use Modules defined in the constructor as\n well as arbitrary operators on Tensors.\n \"\"\"\n h_relu = self.linear1(x).clamp(min=0)\n y_pred = self.linear2(h_relu)\n return y_pred\n\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold inputs and outputs\nx = torch.randn(N, D_in)\ny = torch.randn(N, D_out)\n\n# Construct our model by instantiating the class defined above\nmodel = TwoLayerNet(D_in, H, D_out)\n\n# Construct our loss function and an Optimizer. The call to model.parameters()\n# in the SGD constructor will contain the learnable parameters of the two\n# nn.Linear modules which are members of the model.\ncriterion = torch.nn.MSELoss(reduction='sum')\noptimizer = torch.optim.SGD(model.parameters(), lr=1e-4)\nfor t in range(500):\n # Forward pass: Compute predicted y by passing x to the model\n y_pred = model(x)\n\n # Compute and print loss\n loss = criterion(y_pred, y)\n print(t, loss.item())\n\n # Zero gradients, perform a backward pass, and update the weights.\n optimizer.zero_grad()\n loss.backward()\n optimizer.step()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_module.py b/_downloads/two_layer_net_module.py deleted file mode 100644 index bf010efc05c..00000000000 --- a/_downloads/two_layer_net_module.py +++ /dev/null @@ -1,64 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Custom nn Modules --------------------------- - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation defines the model as a custom Module subclass. Whenever you -want a model more complex than a simple sequence of existing Modules you will -need to define your model this way. -""" -import torch - - -class TwoLayerNet(torch.nn.Module): - def __init__(self, D_in, H, D_out): - """ - In the constructor we instantiate two nn.Linear modules and assign them as - member variables. - """ - super(TwoLayerNet, self).__init__() - self.linear1 = torch.nn.Linear(D_in, H) - self.linear2 = torch.nn.Linear(H, D_out) - - def forward(self, x): - """ - In the forward function we accept a Tensor of input data and we must return - a Tensor of output data. We can use Modules defined in the constructor as - well as arbitrary operators on Tensors. - """ - h_relu = self.linear1(x).clamp(min=0) - y_pred = self.linear2(h_relu) - return y_pred - - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold inputs and outputs -x = torch.randn(N, D_in) -y = torch.randn(N, D_out) - -# Construct our model by instantiating the class defined above -model = TwoLayerNet(D_in, H, D_out) - -# Construct our loss function and an Optimizer. The call to model.parameters() -# in the SGD constructor will contain the learnable parameters of the two -# nn.Linear modules which are members of the model. 
-criterion = torch.nn.MSELoss(reduction='sum') -optimizer = torch.optim.SGD(model.parameters(), lr=1e-4) -for t in range(500): - # Forward pass: Compute predicted y by passing x to the model - y_pred = model(x) - - # Compute and print loss - loss = criterion(y_pred, y) - print(t, loss.item()) - - # Zero gradients, perform a backward pass, and update the weights. - optimizer.zero_grad() - loss.backward() - optimizer.step() diff --git a/_downloads/two_layer_net_nn.ipynb b/_downloads/two_layer_net_nn.ipynb deleted file mode 100644 index c0807c9bfcc..00000000000 --- a/_downloads/two_layer_net_nn.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: nn\n-----------\n\nA fully-connected ReLU network with one hidden layer, trained to predict y from x\nby minimizing squared Euclidean distance.\n\nThis implementation uses the nn package from PyTorch to build the network.\nPyTorch autograd makes it easy to define computational graphs and take gradients,\nbut raw autograd can be a bit too low-level for defining complex neural networks;\nthis is where the nn package can help. The nn package defines a set of Modules,\nwhich you can think of as a neural network layer that has produces output from\ninput and may have some trainable weights.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold inputs and outputs\nx = torch.randn(N, D_in)\ny = torch.randn(N, D_out)\n\n# Use the nn package to define our model as a sequence of layers. nn.Sequential\n# is a Module which contains other Modules, and applies them in sequence to\n# produce its output. Each Linear Module computes output from input using a\n# linear function, and holds internal Tensors for its weight and bias.\nmodel = torch.nn.Sequential(\n torch.nn.Linear(D_in, H),\n torch.nn.ReLU(),\n torch.nn.Linear(H, D_out),\n)\n\n# The nn package also contains definitions of popular loss functions; in this\n# case we will use Mean Squared Error (MSE) as our loss function.\nloss_fn = torch.nn.MSELoss(reduction='sum')\n\nlearning_rate = 1e-4\nfor t in range(500):\n # Forward pass: compute predicted y by passing x to the model. Module objects\n # override the __call__ operator so you can call them like functions. When\n # doing so you pass a Tensor of input data to the Module and it produces\n # a Tensor of output data.\n y_pred = model(x)\n\n # Compute and print loss. We pass Tensors containing the predicted and true\n # values of y, and the loss function returns a Tensor containing the\n # loss.\n loss = loss_fn(y_pred, y)\n print(t, loss.item())\n\n # Zero the gradients before running the backward pass.\n model.zero_grad()\n\n # Backward pass: compute gradient of the loss with respect to all the learnable\n # parameters of the model. Internally, the parameters of each Module are stored\n # in Tensors with requires_grad=True, so this call will compute gradients for\n # all learnable parameters in the model.\n loss.backward()\n\n # Update the weights using gradient descent. 
Each parameter is a Tensor, so\n # we can access its gradients like we did before.\n with torch.no_grad():\n for param in model.parameters():\n param -= learning_rate * param.grad" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_nn.py b/_downloads/two_layer_net_nn.py deleted file mode 100644 index 51bf623b01b..00000000000 --- a/_downloads/two_layer_net_nn.py +++ /dev/null @@ -1,67 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: nn ------------ - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation uses the nn package from PyTorch to build the network. -PyTorch autograd makes it easy to define computational graphs and take gradients, -but raw autograd can be a bit too low-level for defining complex neural networks; -this is where the nn package can help. The nn package defines a set of Modules, -which you can think of as a neural network layer that has produces output from -input and may have some trainable weights. -""" -import torch - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold inputs and outputs -x = torch.randn(N, D_in) -y = torch.randn(N, D_out) - -# Use the nn package to define our model as a sequence of layers. nn.Sequential -# is a Module which contains other Modules, and applies them in sequence to -# produce its output. Each Linear Module computes output from input using a -# linear function, and holds internal Tensors for its weight and bias. -model = torch.nn.Sequential( - torch.nn.Linear(D_in, H), - torch.nn.ReLU(), - torch.nn.Linear(H, D_out), -) - -# The nn package also contains definitions of popular loss functions; in this -# case we will use Mean Squared Error (MSE) as our loss function. -loss_fn = torch.nn.MSELoss(reduction='sum') - -learning_rate = 1e-4 -for t in range(500): - # Forward pass: compute predicted y by passing x to the model. Module objects - # override the __call__ operator so you can call them like functions. When - # doing so you pass a Tensor of input data to the Module and it produces - # a Tensor of output data. - y_pred = model(x) - - # Compute and print loss. We pass Tensors containing the predicted and true - # values of y, and the loss function returns a Tensor containing the - # loss. - loss = loss_fn(y_pred, y) - print(t, loss.item()) - - # Zero the gradients before running the backward pass. - model.zero_grad() - - # Backward pass: compute gradient of the loss with respect to all the learnable - # parameters of the model. Internally, the parameters of each Module are stored - # in Tensors with requires_grad=True, so this call will compute gradients for - # all learnable parameters in the model. - loss.backward() - - # Update the weights using gradient descent. Each parameter is a Tensor, so - # we can access its gradients like we did before. 
- with torch.no_grad(): - for param in model.parameters(): - param -= learning_rate * param.grad diff --git a/_downloads/two_layer_net_numpy.ipynb b/_downloads/two_layer_net_numpy.ipynb deleted file mode 100644 index 4b9cdd79bd0..00000000000 --- a/_downloads/two_layer_net_numpy.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nWarm-up: numpy\n--------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x using Euclidean error.\n\nThis implementation uses numpy to manually compute the forward pass, loss, and\nbackward pass.\n\nA numpy array is a generic n-dimensional array; it does not know anything about\ndeep learning or gradients or computational graphs, and is just a way to perform\ngeneric numeric computations.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import numpy as np\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random input and output data\nx = np.random.randn(N, D_in)\ny = np.random.randn(N, D_out)\n\n# Randomly initialize weights\nw1 = np.random.randn(D_in, H)\nw2 = np.random.randn(H, D_out)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # Forward pass: compute predicted y\n h = x.dot(w1)\n h_relu = np.maximum(h, 0)\n y_pred = h_relu.dot(w2)\n\n # Compute and print loss\n loss = np.square(y_pred - y).sum()\n print(t, loss)\n\n # Backprop to compute gradients of w1 and w2 with respect to loss\n grad_y_pred = 2.0 * (y_pred - y)\n grad_w2 = h_relu.T.dot(grad_y_pred)\n grad_h_relu = grad_y_pred.dot(w2.T)\n grad_h = grad_h_relu.copy()\n grad_h[h < 0] = 0\n grad_w1 = x.T.dot(grad_h)\n\n # Update weights\n w1 -= learning_rate * grad_w1\n w2 -= learning_rate * grad_w2" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_numpy.py b/_downloads/two_layer_net_numpy.py deleted file mode 100644 index f003d0f002b..00000000000 --- a/_downloads/two_layer_net_numpy.py +++ /dev/null @@ -1,51 +0,0 @@ -# -*- coding: utf-8 -*- -""" -Warm-up: numpy --------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x using Euclidean error. - -This implementation uses numpy to manually compute the forward pass, loss, and -backward pass. - -A numpy array is a generic n-dimensional array; it does not know anything about -deep learning or gradients or computational graphs, and is just a way to perform -generic numeric computations. -""" -import numpy as np - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. 
-N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random input and output data -x = np.random.randn(N, D_in) -y = np.random.randn(N, D_out) - -# Randomly initialize weights -w1 = np.random.randn(D_in, H) -w2 = np.random.randn(H, D_out) - -learning_rate = 1e-6 -for t in range(500): - # Forward pass: compute predicted y - h = x.dot(w1) - h_relu = np.maximum(h, 0) - y_pred = h_relu.dot(w2) - - # Compute and print loss - loss = np.square(y_pred - y).sum() - print(t, loss) - - # Backprop to compute gradients of w1 and w2 with respect to loss - grad_y_pred = 2.0 * (y_pred - y) - grad_w2 = h_relu.T.dot(grad_y_pred) - grad_h_relu = grad_y_pred.dot(w2.T) - grad_h = grad_h_relu.copy() - grad_h[h < 0] = 0 - grad_w1 = x.T.dot(grad_h) - - # Update weights - w1 -= learning_rate * grad_w1 - w2 -= learning_rate * grad_w2 diff --git a/_downloads/two_layer_net_optim.ipynb b/_downloads/two_layer_net_optim.ipynb deleted file mode 100644 index 24f2091e161..00000000000 --- a/_downloads/two_layer_net_optim.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: optim\n--------------\n\nA fully-connected ReLU network with one hidden layer, trained to predict y from x\nby minimizing squared Euclidean distance.\n\nThis implementation uses the nn package from PyTorch to build the network.\n\nRather than manually updating the weights of the model as we have been doing,\nwe use the optim package to define an Optimizer that will update the weights\nfor us. The optim package defines many optimization algorithms that are commonly\nused for deep learning, including SGD+momentum, RMSProp, Adam, etc.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random Tensors to hold inputs and outputs\nx = torch.randn(N, D_in)\ny = torch.randn(N, D_out)\n\n# Use the nn package to define our model and loss function.\nmodel = torch.nn.Sequential(\n torch.nn.Linear(D_in, H),\n torch.nn.ReLU(),\n torch.nn.Linear(H, D_out),\n)\nloss_fn = torch.nn.MSELoss(reduction='sum')\n\n# Use the optim package to define an Optimizer that will update the weights of\n# the model for us. Here we will use Adam; the optim package contains many other\n# optimization algoriths. The first argument to the Adam constructor tells the\n# optimizer which Tensors it should update.\nlearning_rate = 1e-4\noptimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\nfor t in range(500):\n # Forward pass: compute predicted y by passing x to the model.\n y_pred = model(x)\n\n # Compute and print loss.\n loss = loss_fn(y_pred, y)\n print(t, loss.item())\n\n # Before the backward pass, use the optimizer object to zero all of the\n # gradients for the variables it will update (which are the learnable\n # weights of the model). This is because by default, gradients are\n # accumulated in buffers( i.e, not overwritten) whenever .backward()\n # is called. 
Checkout docs of torch.autograd.backward for more details.\n optimizer.zero_grad()\n\n # Backward pass: compute gradient of the loss with respect to model\n # parameters\n loss.backward()\n\n # Calling the step function on an Optimizer makes an update to its\n # parameters\n optimizer.step()" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_optim.py b/_downloads/two_layer_net_optim.py deleted file mode 100644 index 62c44cd0911..00000000000 --- a/_downloads/two_layer_net_optim.py +++ /dev/null @@ -1,61 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: optim --------------- - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation uses the nn package from PyTorch to build the network. - -Rather than manually updating the weights of the model as we have been doing, -we use the optim package to define an Optimizer that will update the weights -for us. The optim package defines many optimization algorithms that are commonly -used for deep learning, including SGD+momentum, RMSProp, Adam, etc. -""" -import torch - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random Tensors to hold inputs and outputs -x = torch.randn(N, D_in) -y = torch.randn(N, D_out) - -# Use the nn package to define our model and loss function. -model = torch.nn.Sequential( - torch.nn.Linear(D_in, H), - torch.nn.ReLU(), - torch.nn.Linear(H, D_out), -) -loss_fn = torch.nn.MSELoss(reduction='sum') - -# Use the optim package to define an Optimizer that will update the weights of -# the model for us. Here we will use Adam; the optim package contains many other -# optimization algoriths. The first argument to the Adam constructor tells the -# optimizer which Tensors it should update. -learning_rate = 1e-4 -optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate) -for t in range(500): - # Forward pass: compute predicted y by passing x to the model. - y_pred = model(x) - - # Compute and print loss. - loss = loss_fn(y_pred, y) - print(t, loss.item()) - - # Before the backward pass, use the optimizer object to zero all of the - # gradients for the variables it will update (which are the learnable - # weights of the model). This is because by default, gradients are - # accumulated in buffers( i.e, not overwritten) whenever .backward() - # is called. Checkout docs of torch.autograd.backward for more details. 
- optimizer.zero_grad() - - # Backward pass: compute gradient of the loss with respect to model - # parameters - loss.backward() - - # Calling the step function on an Optimizer makes an update to its - # parameters - optimizer.step() diff --git a/_downloads/two_layer_net_tensor.ipynb b/_downloads/two_layer_net_tensor.ipynb deleted file mode 100644 index 26020422b15..00000000000 --- a/_downloads/two_layer_net_tensor.ipynb +++ /dev/null @@ -1,54 +0,0 @@ -{ - "cells": [ - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "%matplotlib inline" - ] - }, - { - "cell_type": "markdown", - "metadata": {}, - "source": [ - "\nPyTorch: Tensors\n----------------\n\nA fully-connected ReLU network with one hidden layer and no biases, trained to\npredict y from x by minimizing squared Euclidean distance.\n\nThis implementation uses PyTorch tensors to manually compute the forward pass,\nloss, and backward pass.\n\nA PyTorch Tensor is basically the same as a numpy array: it does not know\nanything about deep learning or computational graphs or gradients, and is just\na generic n-dimensional array to be used for arbitrary numeric computation.\n\nThe biggest difference between a numpy array and a PyTorch Tensor is that\na PyTorch Tensor can run on either CPU or GPU. To run operations on the GPU,\njust cast the Tensor to a cuda datatype.\n\n" - ] - }, - { - "cell_type": "code", - "execution_count": null, - "metadata": { - "collapsed": false - }, - "outputs": [], - "source": [ - "import torch\n\n\ndtype = torch.float\ndevice = torch.device(\"cpu\")\n# device = torch.device(\"cuda:0\") # Uncomment this to run on GPU\n\n# N is batch size; D_in is input dimension;\n# H is hidden dimension; D_out is output dimension.\nN, D_in, H, D_out = 64, 1000, 100, 10\n\n# Create random input and output data\nx = torch.randn(N, D_in, device=device, dtype=dtype)\ny = torch.randn(N, D_out, device=device, dtype=dtype)\n\n# Randomly initialize weights\nw1 = torch.randn(D_in, H, device=device, dtype=dtype)\nw2 = torch.randn(H, D_out, device=device, dtype=dtype)\n\nlearning_rate = 1e-6\nfor t in range(500):\n # Forward pass: compute predicted y\n h = x.mm(w1)\n h_relu = h.clamp(min=0)\n y_pred = h_relu.mm(w2)\n\n # Compute and print loss\n loss = (y_pred - y).pow(2).sum().item()\n print(t, loss)\n\n # Backprop to compute gradients of w1 and w2 with respect to loss\n grad_y_pred = 2.0 * (y_pred - y)\n grad_w2 = h_relu.t().mm(grad_y_pred)\n grad_h_relu = grad_y_pred.mm(w2.t())\n grad_h = grad_h_relu.clone()\n grad_h[h < 0] = 0\n grad_w1 = x.t().mm(grad_h)\n\n # Update weights using gradient descent\n w1 -= learning_rate * grad_w1\n w2 -= learning_rate * grad_w2" - ] - } - ], - "metadata": { - "kernelspec": { - "display_name": "Python 3", - "language": "python", - "name": "python3" - }, - "language_info": { - "codemirror_mode": { - "name": "ipython", - "version": 3 - }, - "file_extension": ".py", - "mimetype": "text/x-python", - "name": "python", - "nbconvert_exporter": "python", - "pygments_lexer": "ipython3", - "version": "3.6.6" - } - }, - "nbformat": 4, - "nbformat_minor": 0 -} \ No newline at end of file diff --git a/_downloads/two_layer_net_tensor.py b/_downloads/two_layer_net_tensor.py deleted file mode 100644 index e3cb4949bbf..00000000000 --- a/_downloads/two_layer_net_tensor.py +++ /dev/null @@ -1,61 +0,0 @@ -# -*- coding: utf-8 -*- -""" -PyTorch: Tensors ----------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained 
to -predict y from x by minimizing squared Euclidean distance. - -This implementation uses PyTorch tensors to manually compute the forward pass, -loss, and backward pass. - -A PyTorch Tensor is basically the same as a numpy array: it does not know -anything about deep learning or computational graphs or gradients, and is just -a generic n-dimensional array to be used for arbitrary numeric computation. - -The biggest difference between a numpy array and a PyTorch Tensor is that -a PyTorch Tensor can run on either CPU or GPU. To run operations on the GPU, -just cast the Tensor to a cuda datatype. -""" - -import torch - - -dtype = torch.float -device = torch.device("cpu") -# device = torch.device("cuda:0") # Uncomment this to run on GPU - -# N is batch size; D_in is input dimension; -# H is hidden dimension; D_out is output dimension. -N, D_in, H, D_out = 64, 1000, 100, 10 - -# Create random input and output data -x = torch.randn(N, D_in, device=device, dtype=dtype) -y = torch.randn(N, D_out, device=device, dtype=dtype) - -# Randomly initialize weights -w1 = torch.randn(D_in, H, device=device, dtype=dtype) -w2 = torch.randn(H, D_out, device=device, dtype=dtype) - -learning_rate = 1e-6 -for t in range(500): - # Forward pass: compute predicted y - h = x.mm(w1) - h_relu = h.clamp(min=0) - y_pred = h_relu.mm(w2) - - # Compute and print loss - loss = (y_pred - y).pow(2).sum().item() - print(t, loss) - - # Backprop to compute gradients of w1 and w2 with respect to loss - grad_y_pred = 2.0 * (y_pred - y) - grad_w2 = h_relu.t().mm(grad_y_pred) - grad_h_relu = grad_y_pred.mm(w2.t()) - grad_h = grad_h_relu.clone() - grad_h[h < 0] = 0 - grad_w1 = x.t().mm(grad_h) - - # Update weights using gradient descent - w1 -= learning_rate * grad_w1 - w2 -= learning_rate * grad_w2 diff --git a/_images/sphx_glr_two_layer_net_autograd_thumb.png b/_images/sphx_glr_two_layer_net_autograd_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_autograd_thumb.png and /dev/null differ diff --git a/_images/sphx_glr_two_layer_net_custom_function_thumb.png b/_images/sphx_glr_two_layer_net_custom_function_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_custom_function_thumb.png and /dev/null differ diff --git a/_images/sphx_glr_two_layer_net_module_thumb.png b/_images/sphx_glr_two_layer_net_module_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_module_thumb.png and /dev/null differ diff --git a/_images/sphx_glr_two_layer_net_nn_thumb.png b/_images/sphx_glr_two_layer_net_nn_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_nn_thumb.png and /dev/null differ diff --git a/_images/sphx_glr_two_layer_net_numpy_thumb.png b/_images/sphx_glr_two_layer_net_numpy_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_numpy_thumb.png and /dev/null differ diff --git a/_images/sphx_glr_two_layer_net_optim_thumb.png b/_images/sphx_glr_two_layer_net_optim_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_optim_thumb.png and /dev/null differ diff --git a/_images/sphx_glr_two_layer_net_tensor_thumb.png b/_images/sphx_glr_two_layer_net_tensor_thumb.png deleted file mode 100644 index 233f8e605ef..00000000000 Binary files a/_images/sphx_glr_two_layer_net_tensor_thumb.png and /dev/null 
differ diff --git a/_sources/beginner/examples_autograd/two_layer_net_autograd.rst.txt b/_sources/beginner/examples_autograd/two_layer_net_autograd.rst.txt deleted file mode 100644 index db61d44aa15..00000000000 --- a/_sources/beginner/examples_autograd/two_layer_net_autograd.rst.txt +++ /dev/null @@ -1,124 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_autograd_two_layer_net_autograd.py: - - -PyTorch: Tensors and autograd -------------------------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation computes the forward pass using operations on PyTorch -Tensors, and uses PyTorch autograd to compute gradients. - - -A PyTorch Tensor represents a node in a computational graph. If ``x`` is a -Tensor that has ``x.requires_grad=True`` then ``x.grad`` is another Tensor -holding the gradient of ``x`` with respect to some scalar value. - - -.. code-block:: default - - import torch - - dtype = torch.float - device = torch.device("cpu") - # device = torch.device("cuda:0") # Uncomment this to run on GPU - # torch.backends.cuda.matmul.allow_tf32 = False # Uncomment this to run on GPU - - # The above line disables TensorFloat32. This a feature that allows - # networks to run at a much faster speed while sacrificing precision. - # Although TensorFloat32 works well on most real models, for our toy model - # in this tutorial, the sacrificed precision causes convergence issue. - # For more information, see: - # https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. - N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random Tensors to hold input and outputs. - # Setting requires_grad=False indicates that we do not need to compute gradients - # with respect to these Tensors during the backward pass. - x = torch.randn(N, D_in, device=device, dtype=dtype) - y = torch.randn(N, D_out, device=device, dtype=dtype) - - # Create random Tensors for weights. - # Setting requires_grad=True indicates that we want to compute gradients with - # respect to these Tensors during the backward pass. - w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True) - w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True) - - learning_rate = 1e-6 - for t in range(500): - # Forward pass: compute predicted y using operations on Tensors; these - # are exactly the same operations we used to compute the forward pass using - # Tensors, but we do not need to keep references to intermediate values since - # we are not implementing the backward pass by hand. - y_pred = x.mm(w1).clamp(min=0).mm(w2) - - # Compute and print loss using operations on Tensors. - # Now loss is a Tensor of shape (1,) - # loss.item() gets the scalar value held in the loss. - loss = (y_pred - y).pow(2).sum() - if t % 100 == 99: - print(t, loss.item()) - - # Use autograd to compute the backward pass. This call will compute the - # gradient of loss with respect to all Tensors with requires_grad=True. - # After this call w1.grad and w2.grad will be Tensors holding the gradient - # of the loss with respect to w1 and w2 respectively. - loss.backward() - - # Manually update weights using gradient descent. 
Wrap in torch.no_grad() - # because weights have requires_grad=True, but we don't need to track this - # in autograd. - # An alternative way is to operate on weight.data and weight.grad.data. - # Recall that tensor.data gives a tensor that shares the storage with - # tensor, but doesn't track history. - # You can also use torch.optim.SGD to achieve this. - with torch.no_grad(): - w1 -= learning_rate * w1.grad - w2 -= learning_rate * w2.grad - - # Manually zero the gradients after updating weights - w1.grad.zero_() - w2.grad.zero_() - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_autograd_two_layer_net_autograd.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_autograd.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_autograd.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/_sources/beginner/examples_autograd/two_layer_net_custom_function.rst.txt b/_sources/beginner/examples_autograd/two_layer_net_custom_function.rst.txt deleted file mode 100644 index 4ddd0580a97..00000000000 --- a/_sources/beginner/examples_autograd/two_layer_net_custom_function.rst.txt +++ /dev/null @@ -1,140 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_autograd_two_layer_net_custom_function.py: - - -PyTorch: Defining New autograd Functions ----------------------------------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation computes the forward pass using operations on PyTorch -Variables, and uses PyTorch autograd to compute gradients. - -In this implementation we implement our own custom autograd function to perform -the ReLU function. - - -.. code-block:: default - - import torch - - - class MyReLU(torch.autograd.Function): - """ - We can implement our own custom autograd Functions by subclassing - torch.autograd.Function and implementing the forward and backward passes - which operate on Tensors. - """ - - @staticmethod - def forward(ctx, input): - """ - In the forward pass we receive a Tensor containing the input and return - a Tensor containing the output. ctx is a context object that can be used - to stash information for backward computation. You can cache arbitrary - objects for use in the backward pass using the ctx.save_for_backward method. - """ - ctx.save_for_backward(input) - return input.clamp(min=0) - - @staticmethod - def backward(ctx, grad_output): - """ - In the backward pass we receive a Tensor containing the gradient of the loss - with respect to the output, and we need to compute the gradient of the loss - with respect to the input. - """ - input, = ctx.saved_tensors - grad_input = grad_output.clone() - grad_input[input < 0] = 0 - return grad_input - - - dtype = torch.float - device = torch.device("cpu") - # device = torch.device("cuda:0") # Uncomment this to run on GPU - # torch.backends.cuda.matmul.allow_tf32 = False # Uncomment this to run on GPU - - # The above line disables TensorFloat32. 
This a feature that allows - # networks to run at a much faster speed while sacrificing precision. - # Although TensorFloat32 works well on most real models, for our toy model - # in this tutorial, the sacrificed precision causes convergence issue. - # For more information, see: - # https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. - N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random Tensors to hold input and outputs. - x = torch.randn(N, D_in, device=device, dtype=dtype) - y = torch.randn(N, D_out, device=device, dtype=dtype) - - # Create random Tensors for weights. - w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True) - w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True) - - learning_rate = 1e-6 - for t in range(500): - # To apply our Function, we use Function.apply method. We alias this as 'relu'. - relu = MyReLU.apply - - # Forward pass: compute predicted y using operations; we compute - # ReLU using our custom autograd operation. - y_pred = relu(x.mm(w1)).mm(w2) - - # Compute and print loss - loss = (y_pred - y).pow(2).sum() - if t % 100 == 99: - print(t, loss.item()) - - # Use autograd to compute the backward pass. - loss.backward() - - # Update weights using gradient descent - with torch.no_grad(): - w1 -= learning_rate * w1.grad - w2 -= learning_rate * w2.grad - - # Manually zero the gradients after updating weights - w1.grad.zero_() - w2.grad.zero_() - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_autograd_two_layer_net_custom_function.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_custom_function.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_custom_function.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/_sources/beginner/examples_nn/two_layer_net_module.rst.txt b/_sources/beginner/examples_nn/two_layer_net_module.rst.txt deleted file mode 100644 index 011ecc94f87..00000000000 --- a/_sources/beginner/examples_nn/two_layer_net_module.rst.txt +++ /dev/null @@ -1,108 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_nn_two_layer_net_module.py: - - -PyTorch: Custom nn Modules --------------------------- - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation defines the model as a custom Module subclass. Whenever you -want a model more complex than a simple sequence of existing Modules you will -need to define your model this way. - - -.. code-block:: default - - import torch - - - class TwoLayerNet(torch.nn.Module): - def __init__(self, D_in, H, D_out): - """ - In the constructor we instantiate two nn.Linear modules and assign them as - member variables. 
- """ - super(TwoLayerNet, self).__init__() - self.linear1 = torch.nn.Linear(D_in, H) - self.linear2 = torch.nn.Linear(H, D_out) - - def forward(self, x): - """ - In the forward function we accept a Tensor of input data and we must return - a Tensor of output data. We can use Modules defined in the constructor as - well as arbitrary operators on Tensors. - """ - h_relu = self.linear1(x).clamp(min=0) - y_pred = self.linear2(h_relu) - return y_pred - - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. - N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random Tensors to hold inputs and outputs - x = torch.randn(N, D_in) - y = torch.randn(N, D_out) - - # Construct our model by instantiating the class defined above - model = TwoLayerNet(D_in, H, D_out) - - # Construct our loss function and an Optimizer. The call to model.parameters() - # in the SGD constructor will contain the learnable parameters of the two - # nn.Linear modules which are members of the model. - criterion = torch.nn.MSELoss(reduction='sum') - optimizer = torch.optim.SGD(model.parameters(), lr=1e-4) - for t in range(500): - # Forward pass: Compute predicted y by passing x to the model - y_pred = model(x) - - # Compute and print loss - loss = criterion(y_pred, y) - if t % 100 == 99: - print(t, loss.item()) - - # Zero gradients, perform a backward pass, and update the weights. - optimizer.zero_grad() - loss.backward() - optimizer.step() - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_nn_two_layer_net_module.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_module.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_module.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/_sources/beginner/examples_nn/two_layer_net_nn.rst.txt b/_sources/beginner/examples_nn/two_layer_net_nn.rst.txt deleted file mode 100644 index 4ea77a90fb1..00000000000 --- a/_sources/beginner/examples_nn/two_layer_net_nn.rst.txt +++ /dev/null @@ -1,111 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_nn_two_layer_net_nn.py: - - -PyTorch: nn ------------ - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation uses the nn package from PyTorch to build the network. -PyTorch autograd makes it easy to define computational graphs and take gradients, -but raw autograd can be a bit too low-level for defining complex neural networks; -this is where the nn package can help. The nn package defines a set of Modules, -which you can think of as a neural network layer that has produces output from -input and may have some trainable weights. - - -.. code-block:: default - - import torch - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. - N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random Tensors to hold inputs and outputs - x = torch.randn(N, D_in) - y = torch.randn(N, D_out) - - # Use the nn package to define our model as a sequence of layers. 
nn.Sequential - # is a Module which contains other Modules, and applies them in sequence to - # produce its output. Each Linear Module computes output from input using a - # linear function, and holds internal Tensors for its weight and bias. - model = torch.nn.Sequential( - torch.nn.Linear(D_in, H), - torch.nn.ReLU(), - torch.nn.Linear(H, D_out), - ) - - # The nn package also contains definitions of popular loss functions; in this - # case we will use Mean Squared Error (MSE) as our loss function. - loss_fn = torch.nn.MSELoss(reduction='sum') - - learning_rate = 1e-4 - for t in range(500): - # Forward pass: compute predicted y by passing x to the model. Module objects - # override the __call__ operator so you can call them like functions. When - # doing so you pass a Tensor of input data to the Module and it produces - # a Tensor of output data. - y_pred = model(x) - - # Compute and print loss. We pass Tensors containing the predicted and true - # values of y, and the loss function returns a Tensor containing the - # loss. - loss = loss_fn(y_pred, y) - if t % 100 == 99: - print(t, loss.item()) - - # Zero the gradients before running the backward pass. - model.zero_grad() - - # Backward pass: compute gradient of the loss with respect to all the learnable - # parameters of the model. Internally, the parameters of each Module are stored - # in Tensors with requires_grad=True, so this call will compute gradients for - # all learnable parameters in the model. - loss.backward() - - # Update the weights using gradient descent. Each parameter is a Tensor, so - # we can access its gradients like we did before. - with torch.no_grad(): - for param in model.parameters(): - param -= learning_rate * param.grad - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_nn_two_layer_net_nn.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_nn.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_nn.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/_sources/beginner/examples_nn/two_layer_net_optim.rst.txt b/_sources/beginner/examples_nn/two_layer_net_optim.rst.txt deleted file mode 100644 index f446ee22650..00000000000 --- a/_sources/beginner/examples_nn/two_layer_net_optim.rst.txt +++ /dev/null @@ -1,105 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_nn_two_layer_net_optim.py: - - -PyTorch: optim --------------- - -A fully-connected ReLU network with one hidden layer, trained to predict y from x -by minimizing squared Euclidean distance. - -This implementation uses the nn package from PyTorch to build the network. - -Rather than manually updating the weights of the model as we have been doing, -we use the optim package to define an Optimizer that will update the weights -for us. The optim package defines many optimization algorithms that are commonly -used for deep learning, including SGD+momentum, RMSProp, Adam, etc. - - -.. code-block:: default - - import torch - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. 
- N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random Tensors to hold inputs and outputs - x = torch.randn(N, D_in) - y = torch.randn(N, D_out) - - # Use the nn package to define our model and loss function. - model = torch.nn.Sequential( - torch.nn.Linear(D_in, H), - torch.nn.ReLU(), - torch.nn.Linear(H, D_out), - ) - loss_fn = torch.nn.MSELoss(reduction='sum') - - # Use the optim package to define an Optimizer that will update the weights of - # the model for us. Here we will use Adam; the optim package contains many other - # optimization algorithms. The first argument to the Adam constructor tells the - # optimizer which Tensors it should update. - learning_rate = 1e-4 - optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate) - for t in range(500): - # Forward pass: compute predicted y by passing x to the model. - y_pred = model(x) - - # Compute and print loss. - loss = loss_fn(y_pred, y) - if t % 100 == 99: - print(t, loss.item()) - - # Before the backward pass, use the optimizer object to zero all of the - # gradients for the variables it will update (which are the learnable - # weights of the model). This is because by default, gradients are - # accumulated in buffers( i.e, not overwritten) whenever .backward() - # is called. Checkout docs of torch.autograd.backward for more details. - optimizer.zero_grad() - - # Backward pass: compute gradient of the loss with respect to model - # parameters - loss.backward() - - # Calling the step function on an Optimizer makes an update to its - # parameters - optimizer.step() - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_nn_two_layer_net_optim.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_optim.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_optim.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/_sources/beginner/examples_tensor/two_layer_net_numpy.rst.txt b/_sources/beginner/examples_tensor/two_layer_net_numpy.rst.txt deleted file mode 100644 index 5e2010d7848..00000000000 --- a/_sources/beginner/examples_tensor/two_layer_net_numpy.rst.txt +++ /dev/null @@ -1,94 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_tensor_two_layer_net_numpy.py: - - -Warm-up: numpy --------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x using Euclidean error. - -This implementation uses numpy to manually compute the forward pass, loss, and -backward pass. - -A numpy array is a generic n-dimensional array; it does not know anything about -deep learning or gradients or computational graphs, and is just a way to perform -generic numeric computations. - - -.. code-block:: default - - import numpy as np - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. 
- N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random input and output data - x = np.random.randn(N, D_in) - y = np.random.randn(N, D_out) - - # Randomly initialize weights - w1 = np.random.randn(D_in, H) - w2 = np.random.randn(H, D_out) - - learning_rate = 1e-6 - for t in range(500): - # Forward pass: compute predicted y - h = x.dot(w1) - h_relu = np.maximum(h, 0) - y_pred = h_relu.dot(w2) - - # Compute and print loss - loss = np.square(y_pred - y).sum() - print(t, loss) - - # Backprop to compute gradients of w1 and w2 with respect to loss - grad_y_pred = 2.0 * (y_pred - y) - grad_w2 = h_relu.T.dot(grad_y_pred) - grad_h_relu = grad_y_pred.dot(w2.T) - grad_h = grad_h_relu.copy() - grad_h[h < 0] = 0 - grad_w1 = x.T.dot(grad_h) - - # Update weights - w1 -= learning_rate * grad_w1 - w2 -= learning_rate * grad_w2 - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_tensor_two_layer_net_numpy.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_numpy.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_numpy.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/_sources/beginner/examples_tensor/two_layer_net_tensor.rst.txt b/_sources/beginner/examples_tensor/two_layer_net_tensor.rst.txt deleted file mode 100644 index 3d6a79bb0aa..00000000000 --- a/_sources/beginner/examples_tensor/two_layer_net_tensor.rst.txt +++ /dev/null @@ -1,105 +0,0 @@ -.. note:: - :class: sphx-glr-download-link-note - - Click :ref:`here ` to download the full example code -.. rst-class:: sphx-glr-example-title - -.. _sphx_glr_beginner_examples_tensor_two_layer_net_tensor.py: - - -PyTorch: Tensors ----------------- - -A fully-connected ReLU network with one hidden layer and no biases, trained to -predict y from x by minimizing squared Euclidean distance. - -This implementation uses PyTorch tensors to manually compute the forward pass, -loss, and backward pass. - -A PyTorch Tensor is basically the same as a numpy array: it does not know -anything about deep learning or computational graphs or gradients, and is just -a generic n-dimensional array to be used for arbitrary numeric computation. - -The biggest difference between a numpy array and a PyTorch Tensor is that -a PyTorch Tensor can run on either CPU or GPU. To run operations on the GPU, -just cast the Tensor to a cuda datatype. - - -.. code-block:: default - - - import torch - - - dtype = torch.float - device = torch.device("cpu") - # device = torch.device("cuda:0") # Uncomment this to run on GPU - - # N is batch size; D_in is input dimension; - # H is hidden dimension; D_out is output dimension. 
- N, D_in, H, D_out = 64, 1000, 100, 10 - - # Create random input and output data - x = torch.randn(N, D_in, device=device, dtype=dtype) - y = torch.randn(N, D_out, device=device, dtype=dtype) - - # Randomly initialize weights - w1 = torch.randn(D_in, H, device=device, dtype=dtype) - w2 = torch.randn(H, D_out, device=device, dtype=dtype) - - learning_rate = 1e-6 - for t in range(500): - # Forward pass: compute predicted y - h = x.mm(w1) - h_relu = h.clamp(min=0) - y_pred = h_relu.mm(w2) - - # Compute and print loss - loss = (y_pred - y).pow(2).sum().item() - if t % 100 == 99: - print(t, loss) - - # Backprop to compute gradients of w1 and w2 with respect to loss - grad_y_pred = 2.0 * (y_pred - y) - grad_w2 = h_relu.t().mm(grad_y_pred) - grad_h_relu = grad_y_pred.mm(w2.t()) - grad_h = grad_h_relu.clone() - grad_h[h < 0] = 0 - grad_w1 = x.t().mm(grad_h) - - # Update weights using gradient descent - w1 -= learning_rate * grad_w1 - w2 -= learning_rate * grad_w2 - - -.. rst-class:: sphx-glr-timing - - **Total running time of the script:** ( 0 minutes 0.000 seconds) - - -.. _sphx_glr_download_beginner_examples_tensor_two_layer_net_tensor.py: - - -.. only :: html - - .. container:: sphx-glr-footer - :class: sphx-glr-footer-example - - - - .. container:: sphx-glr-download - - :download:`Download Python source code: two_layer_net_tensor.py ` - - - - .. container:: sphx-glr-download - - :download:`Download Jupyter notebook: two_layer_net_tensor.ipynb ` - - -.. only:: html - - .. rst-class:: sphx-glr-signature - - `Gallery generated by Sphinx-Gallery `_ diff --git a/beginner/examples_autograd/two_layer_net_autograd.html b/beginner/examples_autograd/two_layer_net_autograd.html deleted file mode 100644 index ba5da4ddc7c..00000000000 --- a/beginner/examples_autograd/two_layer_net_autograd.html +++ /dev/null @@ -1,618 +0,0 @@ - - - - - - - - -PyTorch: Tensors and autograd — PyTorch Tutorials 1.7.0 documentation - - - - - - - - - - - - - - - - - - - - - - - - - - - - - - -

PyTorch: Tensors and autograd

-

A fully-connected ReLU network with one hidden layer and no biases, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation computes the forward pass using operations on PyTorch Tensors, and uses PyTorch autograd to compute gradients.

-

A PyTorch Tensor represents a node in a computational graph. If x is a Tensor that has x.requires_grad=True, then x.grad is another Tensor holding the gradient of x with respect to some scalar value.

-
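As a quick illustration of the requires_grad / .grad mechanics described above, here is a minimal sketch (not part of the deleted tutorial file):

import torch

# A scalar toy example: build y from x, call backward(), read x.grad.
x = torch.tensor(2.0, requires_grad=True)
y = x ** 2 + 3 * x
y.backward()          # autograd computes dy/dx and stores it in x.grad
print(x.grad)         # tensor(7.) because dy/dx = 2*x + 3 = 7 at x = 2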
import torch
-
-dtype = torch.float
-device = torch.device("cpu")
-# device = torch.device("cuda:0")  # Uncomment this to run on GPU
-# torch.backends.cuda.matmul.allow_tf32 = False  # Uncomment this to run on GPU
-
-# The above line disables TensorFloat32. This is a feature that allows
-# networks to run at a much faster speed while sacrificing precision.
-# Although TensorFloat32 works well on most real models, for our toy model
-# in this tutorial, the sacrificed precision causes convergence issues.
-# For more information, see:
-# https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random Tensors to hold input and outputs.
-# Setting requires_grad=False indicates that we do not need to compute gradients
-# with respect to these Tensors during the backward pass.
-x = torch.randn(N, D_in, device=device, dtype=dtype)
-y = torch.randn(N, D_out, device=device, dtype=dtype)
-
-# Create random Tensors for weights.
-# Setting requires_grad=True indicates that we want to compute gradients with
-# respect to these Tensors during the backward pass.
-w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True)
-w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True)
-
-learning_rate = 1e-6
-for t in range(500):
-    # Forward pass: compute predicted y using operations on Tensors; these
-    # are exactly the same operations we used to compute the forward pass using
-    # Tensors, but we do not need to keep references to intermediate values since
-    # we are not implementing the backward pass by hand.
-    y_pred = x.mm(w1).clamp(min=0).mm(w2)
-
-    # Compute and print loss using operations on Tensors.
-    # Now loss is a zero-dimensional (scalar) Tensor.
-    # loss.item() gets the scalar value held in the loss.
-    loss = (y_pred - y).pow(2).sum()
-    if t % 100 == 99:
-        print(t, loss.item())
-
-    # Use autograd to compute the backward pass. This call will compute the
-    # gradient of loss with respect to all Tensors with requires_grad=True.
-    # After this call w1.grad and w2.grad will be Tensors holding the gradient
-    # of the loss with respect to w1 and w2 respectively.
-    loss.backward()
-
-    # Manually update weights using gradient descent. Wrap in torch.no_grad()
-    # because weights have requires_grad=True, but we don't need to track this
-    # in autograd.
-    # An alternative way is to operate on weight.data and weight.grad.data.
-    # Recall that tensor.data gives a tensor that shares the storage with
-    # tensor, but doesn't track history.
-    # You can also use torch.optim.SGD to achieve this.
-    with torch.no_grad():
-        w1 -= learning_rate * w1.grad
-        w2 -= learning_rate * w2.grad
-
-        # Manually zero the gradients after updating weights
-        w1.grad.zero_()
-        w2.grad.zero_()
-
-
-
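The comment in the loop above mentions torch.optim.SGD as an alternative to the hand-written update; as a hedged sketch (not part of the deleted sources), the equivalent training loop would look like this:

import torch

N, D_in, H, D_out = 64, 1000, 100, 10
x = torch.randn(N, D_in)
y = torch.randn(N, D_out)
w1 = torch.randn(D_in, H, requires_grad=True)
w2 = torch.randn(H, D_out, requires_grad=True)

# Plain SGD performs w -= lr * w.grad on step(), matching the manual update.
optimizer = torch.optim.SGD([w1, w2], lr=1e-6)

for t in range(500):
    y_pred = x.mm(w1).clamp(min=0).mm(w2)
    loss = (y_pred - y).pow(2).sum()

    optimizer.zero_grad()   # replaces the manual w1.grad.zero_() / w2.grad.zero_()
    loss.backward()
    optimizer.step()        # replaces the manual in-place subtraction under no_grad()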

Total running time of the script: ( 0 minutes 0.000 seconds)

- -

Gallery generated by Sphinx-Gallery

\ No newline at end of file diff --git a/beginner/examples_autograd/two_layer_net_autograd.html b/beginner/examples_autograd/two_layer_net_autograd.html new file mode 120000 index 00000000000..b3becdbca4e --- /dev/null +++ b/beginner/examples_autograd/two_layer_net_autograd.html @@ -0,0 +1 @@ +beginner/examples_autograd/polynomial_autograd.html \ No newline at end of file diff --git a/beginner/examples_autograd/two_layer_net_custom_function.html b/beginner/examples_autograd/two_layer_net_custom_function.html deleted file mode 100644 index a9997362691..00000000000 --- a/beginner/examples_autograd/two_layer_net_custom_function.html +++ /dev/null @@ -1,635 +0,0 @@ -PyTorch: Defining New autograd Functions — PyTorch Tutorials 1.7.0 documentation
-
-
-
- -
-
-
- Shortcuts -
-
-
-
- -
-
-
- -
-

PyTorch: Defining New autograd Functions

-

A fully-connected ReLU network with one hidden layer and no biases, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation computes the forward pass using operations on PyTorch Tensors, and uses PyTorch autograd to compute gradients.

-

In this implementation we implement our own custom autograd Function to perform the ReLU nonlinearity.

-
import torch
-
-
-class MyReLU(torch.autograd.Function):
-    """
-    We can implement our own custom autograd Functions by subclassing
-    torch.autograd.Function and implementing the forward and backward passes
-    which operate on Tensors.
-    """
-
-    @staticmethod
-    def forward(ctx, input):
-        """
-        In the forward pass we receive a Tensor containing the input and return
-        a Tensor containing the output. ctx is a context object that can be used
-        to stash information for backward computation. You can cache arbitrary
-        objects for use in the backward pass using the ctx.save_for_backward method.
-        """
-        ctx.save_for_backward(input)
-        return input.clamp(min=0)
-
-    @staticmethod
-    def backward(ctx, grad_output):
-        """
-        In the backward pass we receive a Tensor containing the gradient of the loss
-        with respect to the output, and we need to compute the gradient of the loss
-        with respect to the input.
-        """
-        input, = ctx.saved_tensors
-        grad_input = grad_output.clone()
-        grad_input[input < 0] = 0
-        return grad_input
-
-
-dtype = torch.float
-device = torch.device("cpu")
-# device = torch.device("cuda:0")  # Uncomment this to run on GPU
-# torch.backends.cuda.matmul.allow_tf32 = False  # Uncomment this when running on GPU to disable TF32
-
-# The above line disables TensorFloat32. This is a feature that allows
-# networks to run at a much faster speed while sacrificing precision.
-# Although TensorFloat32 works well on most real models, for our toy model
-# in this tutorial the reduced precision causes convergence issues.
-# For more information, see:
-# https://pytorch.org/docs/stable/notes/cuda.html#tensorfloat-32-tf32-on-ampere-devices
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random Tensors to hold input and outputs.
-x = torch.randn(N, D_in, device=device, dtype=dtype)
-y = torch.randn(N, D_out, device=device, dtype=dtype)
-
-# Create random Tensors for weights.
-w1 = torch.randn(D_in, H, device=device, dtype=dtype, requires_grad=True)
-w2 = torch.randn(H, D_out, device=device, dtype=dtype, requires_grad=True)
-
-learning_rate = 1e-6
-for t in range(500):
-    # To apply our Function, we use the Function.apply method. We alias this as 'relu'.
-    relu = MyReLU.apply
-
-    # Forward pass: compute predicted y using operations; we compute
-    # ReLU using our custom autograd operation.
-    y_pred = relu(x.mm(w1)).mm(w2)
-
-    # Compute and print loss
-    loss = (y_pred - y).pow(2).sum()
-    if t % 100 == 99:
-        print(t, loss.item())
-
-    # Use autograd to compute the backward pass.
-    loss.backward()
-
-    # Update weights using gradient descent
-    with torch.no_grad():
-        w1 -= learning_rate * w1.grad
-        w2 -= learning_rate * w2.grad
-
-        # Manually zero the gradients after updating weights
-        w1.grad.zero_()
-        w2.grad.zero_()
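
One way to build confidence in a custom Function's backward is torch.autograd.gradcheck, which compares the analytical gradient against numerical finite differences. A minimal sketch (not part of the original page); it assumes the MyReLU class above is in scope, and the double-precision input is my own choice to satisfy gradcheck's default tolerances.

import torch

test_input = torch.randn(8, 5, dtype=torch.double, requires_grad=True)
# Returns True if MyReLU.backward matches the numerical gradient.
print(torch.autograd.gradcheck(MyReLU.apply, (test_input,), eps=1e-6, atol=1e-4))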
diff --git a/beginner/examples_autograd/two_layer_net_custom_function.html b/beginner/examples_autograd/two_layer_net_custom_function.html
new file mode 120000
index 00000000000..76ad5f084ae
--- /dev/null
+++ b/beginner/examples_autograd/two_layer_net_custom_function.html
@@ -0,0 +1 @@
+beginner/examples_autograd/polynomial_custom_function.html
\ No newline at end of file
diff --git a/beginner/examples_nn/two_layer_net_module.html b/beginner/examples_nn/two_layer_net_module.html
deleted file mode 100644
index 68cb0e0c277..00000000000
--- a/beginner/examples_nn/two_layer_net_module.html
+++ /dev/null
@@ -1,604 +0,0 @@
-PyTorch: Custom nn Modules — PyTorch Tutorials 1.7.0 documentation

PyTorch: Custom nn Modules

-

A fully-connected ReLU network with one hidden layer, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation defines the model as a custom Module subclass. Whenever you want a model more complex than a simple sequence of existing Modules, you will need to define your model this way.

-
import torch
-
-
-class TwoLayerNet(torch.nn.Module):
-    def __init__(self, D_in, H, D_out):
-        """
-        In the constructor we instantiate two nn.Linear modules and assign them as
-        member variables.
-        """
-        super(TwoLayerNet, self).__init__()
-        self.linear1 = torch.nn.Linear(D_in, H)
-        self.linear2 = torch.nn.Linear(H, D_out)
-
-    def forward(self, x):
-        """
-        In the forward function we accept a Tensor of input data and we must return
-        a Tensor of output data. We can use Modules defined in the constructor as
-        well as arbitrary operators on Tensors.
-        """
-        h_relu = self.linear1(x).clamp(min=0)
-        y_pred = self.linear2(h_relu)
-        return y_pred
-
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random Tensors to hold inputs and outputs
-x = torch.randn(N, D_in)
-y = torch.randn(N, D_out)
-
-# Construct our model by instantiating the class defined above
-model = TwoLayerNet(D_in, H, D_out)
-
-# Construct our loss function and an Optimizer. The call to model.parameters()
-# in the SGD constructor returns the learnable parameters of the two
-# nn.Linear modules that are members of the model.
-criterion = torch.nn.MSELoss(reduction='sum')
-optimizer = torch.optim.SGD(model.parameters(), lr=1e-4)
-for t in range(500):
-    # Forward pass: Compute predicted y by passing x to the model
-    y_pred = model(x)
-
-    # Compute and print loss
-    loss = criterion(y_pred, y)
-    if t % 100 == 99:
-        print(t, loss.item())
-
-    # Zero gradients, perform a backward pass, and update the weights.
-    optimizer.zero_grad()
-    loss.backward()
-    optimizer.step()
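
A quick aside, not from the original page: assigning linear1 and linear2 as attributes in __init__ is what registers their parameters with the Module, which is why model.parameters() can hand them to the optimizer. A small sketch, assuming the TwoLayerNet class above is in scope:

model = TwoLayerNet(1000, 100, 10)
for name, param in model.named_parameters():
    print(name, tuple(param.shape))
# Prints linear1.weight (100, 1000), linear1.bias (100,),
#        linear2.weight (10, 100), linear2.bias (10,)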
diff --git a/beginner/examples_nn/two_layer_net_module.html b/beginner/examples_nn/two_layer_net_module.html
new file mode 120000
index 00000000000..4cbc2016dcb
--- /dev/null
+++ b/beginner/examples_nn/two_layer_net_module.html
@@ -0,0 +1 @@
+beginner/examples_nn/polynomial_module.html
\ No newline at end of file
diff --git a/beginner/examples_nn/two_layer_net_nn.html b/beginner/examples_nn/two_layer_net_nn.html
deleted file mode 100644
index bb76ff0796f..00000000000
--- a/beginner/examples_nn/two_layer_net_nn.html
+++ /dev/null
@@ -1,607 +0,0 @@
-PyTorch: nn — PyTorch Tutorials 1.7.0 documentation

PyTorch: nn

-

A fully-connected ReLU network with one hidden layer, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation uses the nn package from PyTorch to build the network. PyTorch autograd makes it easy to define computational graphs and take gradients, but raw autograd can be a bit too low-level for defining complex neural networks; this is where the nn package can help. The nn package defines a set of Modules, which you can think of as a neural network layer that produces output from input and may have some trainable weights.

-
import torch
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random Tensors to hold inputs and outputs
-x = torch.randn(N, D_in)
-y = torch.randn(N, D_out)
-
-# Use the nn package to define our model as a sequence of layers. nn.Sequential
-# is a Module which contains other Modules, and applies them in sequence to
-# produce its output. Each Linear Module computes output from input using a
-# linear function, and holds internal Tensors for its weight and bias.
-model = torch.nn.Sequential(
-    torch.nn.Linear(D_in, H),
-    torch.nn.ReLU(),
-    torch.nn.Linear(H, D_out),
-)
-
-# The nn package also contains definitions of popular loss functions; in this
-# case we will use Mean Squared Error (MSE) as our loss function.
-loss_fn = torch.nn.MSELoss(reduction='sum')
-
-learning_rate = 1e-4
-for t in range(500):
-    # Forward pass: compute predicted y by passing x to the model. Module objects
-    # override the __call__ operator so you can call them like functions. When
-    # doing so you pass a Tensor of input data to the Module and it produces
-    # a Tensor of output data.
-    y_pred = model(x)
-
-    # Compute and print loss. We pass Tensors containing the predicted and true
-    # values of y, and the loss function returns a Tensor containing the
-    # loss.
-    loss = loss_fn(y_pred, y)
-    if t % 100 == 99:
-        print(t, loss.item())
-
-    # Zero the gradients before running the backward pass.
-    model.zero_grad()
-
-    # Backward pass: compute gradient of the loss with respect to all the learnable
-    # parameters of the model. Internally, the parameters of each Module are stored
-    # in Tensors with requires_grad=True, so this call will compute gradients for
-    # all learnable parameters in the model.
-    loss.backward()
-
-    # Update the weights using gradient descent. Each parameter is a Tensor, so
-    # we can access its gradients like we did before.
-    with torch.no_grad():
-        for param in model.parameters():
-            param -= learning_rate * param.grad
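
As a side note (not in the original page), nn.Sequential simply applies its children in order, so calling the model is equivalent to chaining the layers by hand. A minimal self-contained sketch with the same layer sizes:

import torch

model = torch.nn.Sequential(
    torch.nn.Linear(1000, 100),
    torch.nn.ReLU(),
    torch.nn.Linear(100, 10),
)
x = torch.randn(64, 1000)

out_seq = model(x)
out_manual = x
for layer in model:              # a Sequential iterates over its sub-Modules in order
    out_manual = layer(out_manual)
print(torch.allclose(out_seq, out_manual))   # True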
diff --git a/beginner/examples_nn/two_layer_net_nn.html b/beginner/examples_nn/two_layer_net_nn.html
new file mode 120000
index 00000000000..a398f26bb6f
--- /dev/null
+++ b/beginner/examples_nn/two_layer_net_nn.html
@@ -0,0 +1 @@
+beginner/examples_nn/polynomial_nn.html
\ No newline at end of file
diff --git a/beginner/examples_nn/two_layer_net_optim.html b/beginner/examples_nn/two_layer_net_optim.html
deleted file mode 100644
index 44836b3045c..00000000000
--- a/beginner/examples_nn/two_layer_net_optim.html
+++ /dev/null
@@ -1,600 +0,0 @@
-PyTorch: optim — PyTorch Tutorials 1.7.0 documentation

PyTorch: optim

-

A fully-connected ReLU network with one hidden layer, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation uses the nn package from PyTorch to build the network.

-

Rather than manually updating the weights of the model as we have been doing, we use the optim package to define an Optimizer that will update the weights for us. The optim package defines many optimization algorithms that are commonly used for deep learning, including SGD+momentum, RMSProp, Adam, etc.

-
import torch
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random Tensors to hold inputs and outputs
-x = torch.randn(N, D_in)
-y = torch.randn(N, D_out)
-
-# Use the nn package to define our model and loss function.
-model = torch.nn.Sequential(
-    torch.nn.Linear(D_in, H),
-    torch.nn.ReLU(),
-    torch.nn.Linear(H, D_out),
-)
-loss_fn = torch.nn.MSELoss(reduction='sum')
-
-# Use the optim package to define an Optimizer that will update the weights of
-# the model for us. Here we will use Adam; the optim package contains many other
-# optimization algorithms. The first argument to the Adam constructor tells the
-# optimizer which Tensors it should update.
-learning_rate = 1e-4
-optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)
-for t in range(500):
-    # Forward pass: compute predicted y by passing x to the model.
-    y_pred = model(x)
-
-    # Compute and print loss.
-    loss = loss_fn(y_pred, y)
-    if t % 100 == 99:
-        print(t, loss.item())
-
-    # Before the backward pass, use the optimizer object to zero all of the
-    # gradients for the Tensors it will update (which are the learnable
-    # weights of the model). This is because, by default, gradients are
-    # accumulated in buffers (i.e., not overwritten) whenever .backward()
-    # is called. Check out the docs of torch.autograd.backward for more details.
-    optimizer.zero_grad()
-
-    # Backward pass: compute gradient of the loss with respect to model
-    # parameters
-    loss.backward()
-
-    # Calling the step function on an Optimizer makes an update to its
-    # parameters
-    optimizer.step()
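
The other algorithms named above drop into the same training loop unchanged; only the constructor call differs. A brief sketch (not part of the original page), assuming the model defined above:

optimizer = torch.optim.SGD(model.parameters(), lr=1e-4, momentum=0.9)   # SGD + momentum
# optimizer = torch.optim.RMSprop(model.parameters(), lr=1e-4)           # RMSProp
# optimizer = torch.optim.Adam(model.parameters(), lr=1e-4)              # Adam, as used above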
diff --git a/beginner/examples_nn/two_layer_net_optim.html b/beginner/examples_nn/two_layer_net_optim.html
new file mode 120000
index 00000000000..7e7a248b13d
--- /dev/null
+++ b/beginner/examples_nn/two_layer_net_optim.html
@@ -0,0 +1 @@
+beginner/examples_nn/polynomial_optim.html
\ No newline at end of file
diff --git a/beginner/examples_tensor/two_layer_net_numpy.html b/beginner/examples_tensor/two_layer_net_numpy.html
deleted file mode 100644
index 0ff835eea31..00000000000
--- a/beginner/examples_tensor/two_layer_net_numpy.html
+++ /dev/null
@@ -1,589 +0,0 @@
-Warm-up: numpy — PyTorch Tutorials 1.7.0 documentation

Warm-up: numpy

-

A fully-connected ReLU network with one hidden layer and no biases, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation uses numpy to manually compute the forward pass, loss, and backward pass.

-

A numpy array is a generic n-dimensional array; it does not know anything about deep learning or gradients or computational graphs, and is just a way to perform generic numeric computations.

-
import numpy as np
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random input and output data
-x = np.random.randn(N, D_in)
-y = np.random.randn(N, D_out)
-
-# Randomly initialize weights
-w1 = np.random.randn(D_in, H)
-w2 = np.random.randn(H, D_out)
-
-learning_rate = 1e-6
-for t in range(500):
-    # Forward pass: compute predicted y
-    h = x.dot(w1)
-    h_relu = np.maximum(h, 0)
-    y_pred = h_relu.dot(w2)
-
-    # Compute and print loss
-    loss = np.square(y_pred - y).sum()
-    print(t, loss)
-
-    # Backprop to compute gradients of w1 and w2 with respect to loss
-    grad_y_pred = 2.0 * (y_pred - y)
-    grad_w2 = h_relu.T.dot(grad_y_pred)
-    grad_h_relu = grad_y_pred.dot(w2.T)
-    grad_h = grad_h_relu.copy()
-    grad_h[h < 0] = 0
-    grad_w1 = x.T.dot(grad_h)
-
-    # Update weights
-    w1 -= learning_rate * grad_w1
-    w2 -= learning_rate * grad_w2
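
A quick way to sanity-check the hand-derived gradients above is a central finite-difference comparison. A small self-contained sketch (not part of the original page); the tiny shapes are my own choice to keep it fast:

import numpy as np

def loss_fn(x, y, w1, w2):
    return np.square(np.maximum(x.dot(w1), 0).dot(w2) - y).sum()

rng = np.random.default_rng(0)
x, y = rng.standard_normal((4, 6)), rng.standard_normal((4, 3))
w1, w2 = rng.standard_normal((6, 5)), rng.standard_normal((5, 3))

h_relu = np.maximum(x.dot(w1), 0)
grad_w2 = h_relu.T.dot(2.0 * (h_relu.dot(w2) - y))   # analytic gradient, as derived above

eps = 1e-6
w2_plus, w2_minus = w2.copy(), w2.copy()
w2_plus[0, 0] += eps
w2_minus[0, 0] -= eps
numeric = (loss_fn(x, y, w1, w2_plus) - loss_fn(x, y, w1, w2_minus)) / (2 * eps)
print(grad_w2[0, 0], numeric)   # the two values should agree closely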
diff --git a/beginner/examples_tensor/two_layer_net_numpy.html b/beginner/examples_tensor/two_layer_net_numpy.html
new file mode 120000
index 00000000000..1327fa851b4
--- /dev/null
+++ b/beginner/examples_tensor/two_layer_net_numpy.html
@@ -0,0 +1 @@
+beginner/examples_tensor/polynomial_numpy.html
\ No newline at end of file
diff --git a/beginner/examples_tensor/two_layer_net_tensor.html b/beginner/examples_tensor/two_layer_net_tensor.html
deleted file mode 100644
index 03f54270045..00000000000
--- a/beginner/examples_tensor/two_layer_net_tensor.html
+++ /dev/null
@@ -1,598 +0,0 @@
-PyTorch: Tensors — PyTorch Tutorials 1.7.0 documentation


PyTorch: Tensors

-

A fully-connected ReLU network with one hidden layer and no biases, trained to predict y from x by minimizing squared Euclidean distance.

-

This implementation uses PyTorch tensors to manually compute the forward pass, loss, and backward pass.

-

A PyTorch Tensor is basically the same as a numpy array: it does not know anything about deep learning or computational graphs or gradients, and is just a generic n-dimensional array to be used for arbitrary numeric computation.

-

The biggest difference between a numpy array and a PyTorch Tensor is that a PyTorch Tensor can run on either CPU or GPU. To run operations on the GPU, just create the Tensor on (or move it to) a CUDA device.

-
import torch
-
-
-dtype = torch.float
-device = torch.device("cpu")
-# device = torch.device("cuda:0") # Uncomment this to run on GPU
-
-# N is batch size; D_in is input dimension;
-# H is hidden dimension; D_out is output dimension.
-N, D_in, H, D_out = 64, 1000, 100, 10
-
-# Create random input and output data
-x = torch.randn(N, D_in, device=device, dtype=dtype)
-y = torch.randn(N, D_out, device=device, dtype=dtype)
-
-# Randomly initialize weights
-w1 = torch.randn(D_in, H, device=device, dtype=dtype)
-w2 = torch.randn(H, D_out, device=device, dtype=dtype)
-
-learning_rate = 1e-6
-for t in range(500):
-    # Forward pass: compute predicted y
-    h = x.mm(w1)
-    h_relu = h.clamp(min=0)
-    y_pred = h_relu.mm(w2)
-
-    # Compute and print loss
-    loss = (y_pred - y).pow(2).sum().item()
-    if t % 100 == 99:
-        print(t, loss)
-
-    # Backprop to compute gradients of w1 and w2 with respect to loss
-    grad_y_pred = 2.0 * (y_pred - y)
-    grad_w2 = h_relu.t().mm(grad_y_pred)
-    grad_h_relu = grad_y_pred.mm(w2.t())
-    grad_h = grad_h_relu.clone()
-    grad_h[h < 0] = 0
-    grad_w1 = x.t().mm(grad_h)
-
-    # Update weights using gradient descent
-    w1 -= learning_rate * grad_w1
-    w2 -= learning_rate * grad_w2
-
diff --git a/beginner/examples_tensor/two_layer_net_tensor.html b/beginner/examples_tensor/two_layer_net_tensor.html
new file mode 120000
index 00000000000..c063e8c7a2d
--- /dev/null
+++ b/beginner/examples_tensor/two_layer_net_tensor.html
@@ -0,0 +1 @@
+beginner/examples_tensor/polynomial_tensor.html
\ No newline at end of file