{ "cells": [ { "cell_type": "markdown", "metadata": {}, "source": [ "# DS4420: Fun with autoencoders and self-supervision" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "*Your name*: " ] }, { "cell_type": "code", "execution_count": 179, "metadata": {}, "outputs": [], "source": [ "import numpy as np \n", "import matplotlib.pyplot as plt\n", "\n", "import torch\n", "from torch import nn\n", "# conda install -c pytorch torchvision\n", "import torchvision\n", "\n", "# note: if you cannot get torchvision installed \n", "# using the above sequence, you can resort to \n", "# the colab version here: \n", "# -- just be sure to download and then upload\n", "# the notebook to blackboard when complete.\n", "fMNIST = torchvision.datasets.FashionMNIST(\n", " root = './data/FashionMNIST',\n", " train = True,\n", " download = True) " ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Once again, we are playing with Fashion-MNIST here, following the last few lectures." ] }, { "cell_type": "code", "execution_count": 180, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 180, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAPsAAAD4CAYAAAAq5pAIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAAOwUlEQVR4nO3df4xV9ZnH8c/jDPiDHwoKBMF12KKyG/8QJbphzcaNgbj8g2isYEzcbJOpWrUmm7ikS1ITNTG7WzfxnyY0NWU3XZsmamqazbYGm7V/VYFYQbAVG34MTBgBDYMO8uvZP+ZMd4pzvt/xnnvuufC8X8nkzpznnnueOcOHe+793nO+5u4CcOG7qOkGAHQGYQeCIOxAEIQdCIKwA0H0dnJjZsZb/0DN3N0mWl7pmd3M7jKz35nZbjNbX+WxANTLWh1nN7MeSb+XtELSgKR3JK1z952JdXhmB2pWxzP7rZJ2u/sf3P2kpJ9IWl3h8QDUqErYF0jaP+7ngWLZnzCzfjPbYmZbKmwLQEVV3qCb6FDhS4fp7r5R0kaJw3igSVWe2QckXTPu54WSDlZrB0BdqoT9HUnXmdkiM5sqaa2k19vTFoB2a/kw3t1Pm9ljkn4hqUfSS+7+fts6A9BWLQ+9tbQxXrMDtavlQzUAzh+EHQiCsANBEHYgCMIOBEHYgSAIOxAEYQeCIOxAEIQdCIKwA0EQdiAIwg4EQdiBIAg7EARhB4Ig7EAQhB0IgrADQRB2IAjCDgRB2IEgCDsQBGEHgiDsQBCEHQiCsANBEHYgCMIOBEHYgSBanp9dksxsj6RhSWcknXb3Ze1oCkD7VQp74W/d/XAbHgdAjTiMB4KoGnaX9Esz22pm/RPdwcz6zWyLmW2puC0AFZi7t76y2dXuftDM5kp6Q9Lj7v5W4v6tbwzApLi7TbS80jO7ux8sbockvSbp1iqPB6A+LYfdzKaZ2Yyx7yWtlLSjXY0BaK8q78bPk/SamY09zn+5+/+0pSsAbVfpNftX3hiv2YHa1fKaHcD5g7ADQRB2IAjCDgRB2IEgCDsQBGEHgiDsQBCEHQiCsANBEHYgCMIOBEHYgSDaccFJVFScJtyy1JmLPT09yXXPnj3b8mNLUm9v+p/Q6dOnk/UqLroo/VyV+93qNGXKlGQ9tV/qOhOVZ3YgCMIOBEHYgSAIOxAEYQeCIOxAEIQdCIKry17gmhwHr+qRRx5J1jds2JCsL1iwoJ3tnDe4uiwQHGEHgiDsQBCEHQiCsANBEHYgCMIOBME4+3kgd757J/+G51q3bl2yvnTp0tLafffdl1x3ZGQkWT916lSyvnPnztJaru+qpk6dmqw/9dRTpbVnn3220rZbHmc3s5fMbMjMdoxbNtvM3jCzD4vbWZW6A1C7yRzG/0jSXecsWy9ps7tfJ2lz8TOALpYNu7u/JenoOYtXS9pUfL9J0t1t7gtAm7V6Dbp57j4oSe4+aGZzy+5oZv2S+lvcDoA2qf2Ck+6+UdJGiTfogCa1OvR2yMzmS1JxO9S+lgDUodWwvy7poeL7hyT9rD3tAKhL9jDezF6WdIekq8xsQNJ3JT0v6adm9g1J+ySlB0yDqzpOXmUcffHixcl6bqx7+fLlyfrKlSuT9Y8++qi0NjAwkFz32LFjyXpfX1+yvmrVqmS9TmvXrk3Wb7vttg518v+yYXf3sk8f3NnmXgDUiI/LAkEQdiAIwg4EQdiBIAg7EMQFM2Vz1el7c6cknjx58iv3NKbqKahXXHFFsv7cc8+V1u6///7kup9//nmyPjg4mKy//fbbyXpq6uJLL700ue4HH3yQrC9cuDBZf+aZZ5L1lLlzSz8BLim/X1944YVkfcmSJaW1W265Jbnu1q1bk/UyPLMDQRB2IAjCDgRB2IEgCDsQBGEHgiDsQBDn1aWkU6eK5sbZz5w5U2XTldx5Z/oEwXvvvTdZf+CBB5L1I0eOlNYOHDiQXDc3ZfPMmTOT9csuuyxZT10OOjfGP3369GR9aCh9zZQ5c+aU1nLTOecuY719+/ZkffXq1cn6JZdcUlqr+nszZTMQHGEHgiDsQBCEHQiCsANBEHYgCMIOBHFejbM36YknniitPfzww8l1582bl6xXvaRy6jMEuW3n5K4DkJO6DkDu9/riiy+S9RkzZiTrF198cWlt7969yXXXrFmTrOds2LAhWX/00UdLa/v27Uuu++CDD5bW9u/frxMnTjDODkRG2IEgCDsQBGEHgiDsQBCEHQiCsANBdNU4+80335xcf8WKFaW1G264Iblu6vxhSbr66quT9dQ5xrlryn/22WfJ+uWXX56s56Z8Tv1uPT09yXVz55Snrvsu5XtL7ZvcOHpuv+b+7aZ6u/7661teV8qfc5777MTHH39cWstdI+DNN98srb344osaGBhobZzdzF4ysyEz2zFu2dNmdsDM3i2+mpsIG8CkTOYw/keS7ppg+b+7+03F13+3ty0A7ZYNu7u/JeloB3oBUKMqb9A9ZmbvFYf5s8ruZGb9ZrbFzLZU2BaAiloN+/clfU3STZIGJX2v7I7uvtHdl7n7sha3BaANWgq7ux9y9zPuflbSDyTd2t62ALRbS2E3s/njflwjaUfZfQF0h+z87Gb2sqQ7JF1lZgOSvivpDjO7SZJL2iPpm5PZ2Jw5c5LzWt9zzz3J9VPzeVcZ75Xy48mp8eiqY7K5c8Zz4/Sffvppaa23N/0nzm079/mE3O+eOqc89xmA3Pztud5Sf9PcufS56+l/8sknldZP/W658/RblQ27u6+bYPEPa+gFQI34uCwQBGEHgiDsQBCEHQiCsANBdPQU197eXk8NQy1ZsiS5/vLly0trN954Y3Lda6+9Nlm/8sork/XUUElueCs3XXRuuulcPTU1cW5oLTf8NXXq1GQ997vnek85fvx4sp4bkkwNt+aGxnK5OHHiRLKe+71TQ3fTpk1Lrvv444+X1rZt26bh4WEuJQ1ERtiBIAg7EARhB4Ig7EAQhB0IgrADQXR8nD11+t6pU6eS6+fGVVNSp1pK0qJFi5L1xYsXl9b6+vqS6+YuU131NNLUmG5unP3w4cPJem6s+8iRI8l66vTbVG0y9ZGRkWQ9d5nslNznC3J/k5zUfs/9O89l1t0ZZwciI+xAEIQdCIKwA0EQdiAIwg4EQdiBILpqyubcebwzZ85MPXZrTRVy5zenxmxz4+S5zw/k5M45T/0Nc+dV53qv83z33LZz9dylplP/XnKXDs/9zXLn8eemXR4eHm5523v37i2t7d69WyMjI4yzA5ERdiAIwg4EQdiBIAg7EARhB4Ig7EAQXTXO3qTcmG1qXDY3Fp0bc82da58bE07J9ZYbh899/qDK9quOdafGqqX0Zy9y4+S53nL7Jff4qfVz5+EfPHgwWW/5fHYzu8bMfmVmu8zsfTP7drF8tpm9YWYfFrezco8FoDmTOYw/Lekf3f0vJP2VpG+Z2V9KWi9ps7tfJ2lz8TOALpUNu7sPuvu24vthSbskLZC0WtKm4m6bJN1dV5MAqku/sDiHmfVJWirpN5LmufugNPofgpnNLVmnX1J/tTYBVDXpsJvZdEmvSHrS3Y9N9sQTd98oaWPxGF37Bh1woZvU0JuZTdFo0H/s7q8Wiw+Z2fyiPl/SUD0tAmiH7NCbjT6Fb5J01N2fHLf8XyUdcffnzWy9pNnu/lTmsXhmB2pWNvQ2mbDfLunXkrZLGrsI+Xc0+rr9p5L+TNI+Sfe5+9HMYxF2oGYth72dCDtQPyaJAIIj7EAQhB0IgrADQRB2IAjCDgRB2IEgCDsQBGEHgiDsQBCEHQiCsANBEHYgCMIOBEHYgSAIOxAEYQeCIOxAEIQdCIKwA0EQdiAIwg4EQdiBIAg7EARhB4Ig7EAQhB0IgrADQRB2IIhs2M3sGjP7lZntMrP3zezbxfKnzeyAmb1bfK2qv10ArZrM/OzzJc13921mNkPSVkl3S/q6pOPu/m+T3hhTNgO1K5uyuXcSKw5KGiy+HzazXZIWtLc9AHX7Sq/ZzaxP0lJJvykWPWZm75nZS2Y2q2SdfjPbYmZbKnUKoJLsYfwf72g2XdL/SnrO3V81s3mSDktySc9o9FD/HzKPwWE8ULOyw/hJhd3Mpkj6uaRfuPsLE9T7JP3c3W/MPA5hB2pWFvbJvBtvkn4oadf4oBdv3I1ZI2lH1SYB1Gcy78bfLunXkrZLOlss/o6kdZJu0uhh/B5J3yzezEs9Fs/sQM0qHca3C2EH6tfyYTyACwNhB4Ig7EAQhB0IgrADQRB2IAjCDgRB2IEgCDsQBGEHgiDsQBCEHQiCsANBEHYgiOwFJ9vssKS9436+qljWjbq1t27tS6K3VrWzt2vLCh09n/1LGzfb4u7LGmsgoVt769a+JHprVad64zAeCIKwA0E0HfaNDW8/pVt769a+JHprVUd6a/Q1O4DOafqZHUCHEHYgiEbCbmZ3mdnvzGy3ma1voocyZrbHzLYX01A3Oj9dMYfekJntGLdstpm9YWYfFrcTzrHXUG9dMY13YprxRvdd09Ofd/w1u5n1SPq9pBWSBiS9I2mdu+/saCMlzGyPpGXu3vgHMMzsbyQdl/QfY1Nrmdm/SDrq7s8X/1HOcvd/6pLentZXnMa7pt7Kphn/ezW479o5/Xkrmnhmv1XSbnf/g7uflPQTSasb6KPruftbko6es3i1pE3F95s0+o+l40p66wruPuju24rvhyWNTTPe6L5L9NURTYR9gaT9434eUHfN9+6SfmlmW82sv+lmJjBvbJqt4nZuw/2cKzuNdyedM8141+y7VqY/r6qJsE80NU03jf/9tbvfLOnvJH2rOFzF5Hxf0tc0OgfgoKTvNdlMMc34K5KedPdjTfYy3gR9dWS/NRH2AUnXjPt5oaSDDfQxIXc/WNwOSXpNoy87usmhsRl0i9uhhvv5I3c/5O5n3P2spB+owX1XTDP+iqQfu/urxeLG991EfXVqvzUR9nckXWdmi8xsqqS1kl5voI8vMbNpxRsnMrNpklaq+6aifl3SQ8X3D0n6WYO9/Ilumca7bJpxNbzvGp/+3N07/iVplUbfkf9I0j830UNJX38u6bfF1/tN9ybpZY0e1p3S6BHRNyRdKWmzpA+L29ld1Nt/anRq7/c0Gqz5DfV2u0ZfGr4n6d3ia1XT+y7RV0f2Gx+XBYLgE3RAEIQdCIKwA0EQdiAIwg4EQdiBIAg7EMT/AUGd8+8h8/s/AAAAAElFTkSuQmCC\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "from IPython.display import Image \n", "from matplotlib.pyplot import imshow\n", "%matplotlib inline\n", "imshow(np.asarray(fMNIST.data[6]), cmap='gray')" ] }, { "cell_type": "code", "execution_count": 181, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "(60000, 784)" ] }, "execution_count": 181, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X = fMNIST.data\n", "X = np.array([x_i.flatten().numpy() for x_i in X])\n", "X = X / 255 # normalize\n", "X.shape" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## A brief detour / torch intro (or refresher)\n", "\n", "We're going to implement a few autoencoder (AE) variants in `torch`. \n", "\n", "Given that for some of you this may serve as something of an introduction to (or at least refresher for) `torch`, Here is one way to define and train a simple model.\n", "\n", "Note that you can also use the simple `Sequential` pipeline to build such straightforward models, but this style affords more flexibility (though overkill for something like this)." ] }, { "cell_type": "code", "execution_count": 182, "metadata": {}, "outputs": [], "source": [ "class SimpleMLP(nn.Module):\n", " def __init__(self, input_size=784, hidden_size=32, n_labels=10):\n", " '''\n", " In the initializer we setup model parameters/layers.\n", " '''\n", " super(SimpleMLP, self).__init__() \n", "\n", " self.input_size = input_size\n", " self.hidden_size = hidden_size\n", " self.n_labels = 10\n", " \n", " # input layer; from x -> z\n", " self.i = nn.Linear(self.input_size, self.hidden_size, bias=False)\n", " # nonlinear activation\n", " self.a = nn.ReLU()\n", " # output layer\n", " self.o = nn.Linear(self.hidden_size, 10)\n", " self.sm = nn.Softmax()\n", " \n", " def forward(self, X):\n", " '''\n", " The forward pass defines how inputs flow forward through\n", " the model (linking layers together).\n", " '''\n", " z = self.i(X)\n", " z = self.a(z)\n", " y_hat = self.o(z)\n", " return y_hat" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Now to actually train the model, we need to define an `optimizer` and a loss function." ] }, { "cell_type": "code", "execution_count": 183, "metadata": {}, "outputs": [], "source": [ "model = SimpleMLP().float()\n", "\n", "from torch import optim\n", "optimizer = optim.SGD(model.parameters(), lr=0.001, momentum=0.9)\n", "\n", "loss_function = nn.CrossEntropyLoss() " ] }, { "cell_type": "code", "execution_count": 184, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "tensor([9, 0, 0, ..., 3, 0, 5])" ] }, "execution_count": 184, "metadata": {}, "output_type": "execute_result" } ], "source": [ "y = fMNIST.targets\n", "y" ] }, { "cell_type": "code", "execution_count": 185, "metadata": {}, "outputs": [], "source": [ "# convert X to a torch tensor\n", "X = torch.tensor(X)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Let's take a look at making predictions and calculating a loss." ] }, { "cell_type": "code", "execution_count": 186, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "tensor(2.3589, grad_fn=)\n" ] } ], "source": [ "# make a prediction for the first 5 instances \n", "# (note that this is \"batched\"; we are pushing \n", "# through 5 instances at once)\n", "y_hat = model(X[:5,:].float())\n", "# calculate loss\n", "loss = loss_function(y_hat, y[:5])\n", "print(loss)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "And now take some number of passes over our training data, incurring loss, and performing backprop." ] }, { "cell_type": "code", "execution_count": 187, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "epoch: 0, batch: 0 // loss: 2.305\n", "epoch: 0, batch: 100 // loss: 1.929\n", "epoch: 0, batch: 200 // loss: 1.576\n", "epoch: 0, batch: 300 // loss: 1.377\n", "epoch: 0, batch: 400 // loss: 1.068\n", "epoch: 0, batch: 500 // loss: 1.100\n", "epoch: 0, batch: 600 // loss: 0.984\n", "epoch: 0, batch: 700 // loss: 0.792\n", "epoch: 0, batch: 800 // loss: 0.861\n", "epoch: 0, batch: 900 // loss: 0.682\n", "epoch: 0, batch: 1000 // loss: 0.832\n", "epoch: 0, batch: 1100 // loss: 0.547\n", "epoch: 0, batch: 1200 // loss: 0.574\n", "\n", "epoch: 1, batch: 0 // loss: 0.745\n", "epoch: 1, batch: 100 // loss: 0.593\n", "epoch: 1, batch: 200 // loss: 0.689\n", "epoch: 1, batch: 300 // loss: 0.644\n", "epoch: 1, batch: 400 // loss: 0.532\n", "epoch: 1, batch: 500 // loss: 0.638\n", "epoch: 1, batch: 600 // loss: 0.727\n", "epoch: 1, batch: 700 // loss: 0.405\n", "epoch: 1, batch: 800 // loss: 0.587\n", "epoch: 1, batch: 900 // loss: 0.369\n", "epoch: 1, batch: 1000 // loss: 0.702\n", "epoch: 1, batch: 1100 // loss: 0.356\n", "epoch: 1, batch: 1200 // loss: 0.446\n", "\n", "epoch: 2, batch: 0 // loss: 0.595\n", "epoch: 2, batch: 100 // loss: 0.479\n", "epoch: 2, batch: 200 // loss: 0.678\n", "epoch: 2, batch: 300 // loss: 0.514\n", "epoch: 2, batch: 400 // loss: 0.383\n", "epoch: 2, batch: 500 // loss: 0.534\n", "epoch: 2, batch: 600 // loss: 0.659\n", "epoch: 2, batch: 700 // loss: 0.322\n", "epoch: 2, batch: 800 // loss: 0.469\n", "epoch: 2, batch: 900 // loss: 0.271\n", "epoch: 2, batch: 1000 // loss: 0.668\n", "epoch: 2, batch: 1100 // loss: 0.271\n", "epoch: 2, batch: 1200 // loss: 0.404\n", "\n", "epoch: 3, batch: 0 // loss: 0.523\n", "epoch: 3, batch: 100 // loss: 0.408\n", "epoch: 3, batch: 200 // loss: 0.694\n", "epoch: 3, batch: 300 // loss: 0.457\n", "epoch: 3, batch: 400 // loss: 0.311\n", "epoch: 3, batch: 500 // loss: 0.498\n", "epoch: 3, batch: 600 // loss: 0.619\n", "epoch: 3, batch: 700 // loss: 0.296\n", "epoch: 3, batch: 800 // loss: 0.407\n", "epoch: 3, batch: 900 // loss: 0.221\n", "epoch: 3, batch: 1000 // loss: 0.658\n", "epoch: 3, batch: 1100 // loss: 0.227\n", "epoch: 3, batch: 1200 // loss: 0.379\n", "\n", "epoch: 4, batch: 0 // loss: 0.470\n", "epoch: 4, batch: 100 // loss: 0.372\n", "epoch: 4, batch: 200 // loss: 0.691\n", "epoch: 4, batch: 300 // loss: 0.421\n", "epoch: 4, batch: 400 // loss: 0.277\n", "epoch: 4, batch: 500 // loss: 0.480\n", "epoch: 4, batch: 600 // loss: 0.593\n", "epoch: 4, batch: 700 // loss: 0.285\n", "epoch: 4, batch: 800 // loss: 0.368\n", "epoch: 4, batch: 900 // loss: 0.191\n", "epoch: 4, batch: 1000 // loss: 0.654\n", "epoch: 4, batch: 1100 // loss: 0.201\n", "epoch: 4, batch: 1200 // loss: 0.352\n", "\n", "epoch: 5, batch: 0 // loss: 0.428\n", "epoch: 5, batch: 100 // loss: 0.352\n", "epoch: 5, batch: 200 // loss: 0.670\n", "epoch: 5, batch: 300 // loss: 0.397\n", "epoch: 5, batch: 400 // loss: 0.258\n", "epoch: 5, batch: 500 // loss: 0.471\n", "epoch: 5, batch: 600 // loss: 0.576\n", "epoch: 5, batch: 700 // loss: 0.279\n", "epoch: 5, batch: 800 // loss: 0.340\n", "epoch: 5, batch: 900 // loss: 0.173\n", "epoch: 5, batch: 1000 // loss: 0.653\n", "epoch: 5, batch: 1100 // loss: 0.185\n", "epoch: 5, batch: 1200 // loss: 0.330\n", "\n", "epoch: 6, batch: 0 // loss: 0.399\n", "epoch: 6, batch: 100 // loss: 0.343\n", "epoch: 6, batch: 200 // loss: 0.645\n", "epoch: 6, batch: 300 // loss: 0.381\n", "epoch: 6, batch: 400 // loss: 0.244\n", "epoch: 6, batch: 500 // loss: 0.459\n", "epoch: 6, batch: 600 // loss: 0.566\n", "epoch: 6, batch: 700 // loss: 0.273\n", "epoch: 6, batch: 800 // loss: 0.322\n", "epoch: 6, batch: 900 // loss: 0.161\n", "epoch: 6, batch: 1000 // loss: 0.650\n", "epoch: 6, batch: 1100 // loss: 0.174\n", "epoch: 6, batch: 1200 // loss: 0.310\n", "\n", "epoch: 7, batch: 0 // loss: 0.375\n", "epoch: 7, batch: 100 // loss: 0.336\n", "epoch: 7, batch: 200 // loss: 0.620\n", "epoch: 7, batch: 300 // loss: 0.372\n", "epoch: 7, batch: 400 // loss: 0.234\n", "epoch: 7, batch: 500 // loss: 0.452\n", "epoch: 7, batch: 600 // loss: 0.556\n", "epoch: 7, batch: 700 // loss: 0.265\n", "epoch: 7, batch: 800 // loss: 0.311\n", "epoch: 7, batch: 900 // loss: 0.149\n", "epoch: 7, batch: 1000 // loss: 0.646\n", "epoch: 7, batch: 1100 // loss: 0.166\n", "epoch: 7, batch: 1200 // loss: 0.293\n", "\n", "epoch: 8, batch: 0 // loss: 0.358\n", "epoch: 8, batch: 100 // loss: 0.331\n", "epoch: 8, batch: 200 // loss: 0.600\n", "epoch: 8, batch: 300 // loss: 0.357\n", "epoch: 8, batch: 400 // loss: 0.226\n", "epoch: 8, batch: 500 // loss: 0.443\n", "epoch: 8, batch: 600 // loss: 0.546\n", "epoch: 8, batch: 700 // loss: 0.259\n", "epoch: 8, batch: 800 // loss: 0.302\n", "epoch: 8, batch: 900 // loss: 0.139\n", "epoch: 8, batch: 1000 // loss: 0.639\n", "epoch: 8, batch: 1100 // loss: 0.160\n", "epoch: 8, batch: 1200 // loss: 0.280\n", "\n", "epoch: 9, batch: 0 // loss: 0.345\n", "epoch: 9, batch: 100 // loss: 0.331\n", "epoch: 9, batch: 200 // loss: 0.582\n", "epoch: 9, batch: 300 // loss: 0.345\n", "epoch: 9, batch: 400 // loss: 0.220\n", "epoch: 9, batch: 500 // loss: 0.432\n", "epoch: 9, batch: 600 // loss: 0.535\n", "epoch: 9, batch: 700 // loss: 0.257\n", "epoch: 9, batch: 800 // loss: 0.295\n", "epoch: 9, batch: 900 // loss: 0.132\n", "epoch: 9, batch: 1000 // loss: 0.633\n", "epoch: 9, batch: 1100 // loss: 0.154\n", "epoch: 9, batch: 1200 // loss: 0.266\n", "\n", "epoch: 10, batch: 0 // loss: 0.332\n", "epoch: 10, batch: 100 // loss: 0.330\n", "epoch: 10, batch: 200 // loss: 0.571\n", "epoch: 10, batch: 300 // loss: 0.337\n", "epoch: 10, batch: 400 // loss: 0.213\n", "epoch: 10, batch: 500 // loss: 0.429\n", "epoch: 10, batch: 600 // loss: 0.527\n", "epoch: 10, batch: 700 // loss: 0.256\n", "epoch: 10, batch: 800 // loss: 0.291\n", "epoch: 10, batch: 900 // loss: 0.126\n", "epoch: 10, batch: 1000 // loss: 0.627\n", "epoch: 10, batch: 1100 // loss: 0.151\n", "epoch: 10, batch: 1200 // loss: 0.253\n", "\n", "epoch: 11, batch: 0 // loss: 0.323\n", "epoch: 11, batch: 100 // loss: 0.330\n", "epoch: 11, batch: 200 // loss: 0.550\n", "epoch: 11, batch: 300 // loss: 0.328\n", "epoch: 11, batch: 400 // loss: 0.207\n", "epoch: 11, batch: 500 // loss: 0.423\n", "epoch: 11, batch: 600 // loss: 0.517\n", "epoch: 11, batch: 700 // loss: 0.252\n", "epoch: 11, batch: 800 // loss: 0.286\n", "epoch: 11, batch: 900 // loss: 0.122\n", "epoch: 11, batch: 1000 // loss: 0.618\n", "epoch: 11, batch: 1100 // loss: 0.149\n", "epoch: 11, batch: 1200 // loss: 0.245\n", "\n", "epoch: 12, batch: 0 // loss: 0.319\n", "epoch: 12, batch: 100 // loss: 0.330\n", "epoch: 12, batch: 200 // loss: 0.537\n", "epoch: 12, batch: 300 // loss: 0.324\n", "epoch: 12, batch: 400 // loss: 0.200\n", "epoch: 12, batch: 500 // loss: 0.414\n", "epoch: 12, batch: 600 // loss: 0.513\n", "epoch: 12, batch: 700 // loss: 0.251\n", "epoch: 12, batch: 800 // loss: 0.284\n", "epoch: 12, batch: 900 // loss: 0.120\n", "epoch: 12, batch: 1000 // loss: 0.609\n", "epoch: 12, batch: 1100 // loss: 0.147\n", "epoch: 12, batch: 1200 // loss: 0.232\n", "\n", "epoch: 13, batch: 0 // loss: 0.311\n", "epoch: 13, batch: 100 // loss: 0.328\n", "epoch: 13, batch: 200 // loss: 0.523\n", "epoch: 13, batch: 300 // loss: 0.325\n", "epoch: 13, batch: 400 // loss: 0.194\n", "epoch: 13, batch: 500 // loss: 0.409\n", "epoch: 13, batch: 600 // loss: 0.501\n", "epoch: 13, batch: 700 // loss: 0.248\n", "epoch: 13, batch: 800 // loss: 0.281\n", "epoch: 13, batch: 900 // loss: 0.117\n", "epoch: 13, batch: 1000 // loss: 0.603\n", "epoch: 13, batch: 1100 // loss: 0.145\n", "epoch: 13, batch: 1200 // loss: 0.222\n", "\n", "epoch: 14, batch: 0 // loss: 0.307\n", "epoch: 14, batch: 100 // loss: 0.328\n", "epoch: 14, batch: 200 // loss: 0.508\n", "epoch: 14, batch: 300 // loss: 0.322\n", "epoch: 14, batch: 400 // loss: 0.188\n", "epoch: 14, batch: 500 // loss: 0.407\n", "epoch: 14, batch: 600 // loss: 0.490\n", "epoch: 14, batch: 700 // loss: 0.249\n", "epoch: 14, batch: 800 // loss: 0.286\n", "epoch: 14, batch: 900 // loss: 0.112\n", "epoch: 14, batch: 1000 // loss: 0.597\n", "epoch: 14, batch: 1100 // loss: 0.143\n", "epoch: 14, batch: 1200 // loss: 0.215\n", "\n", "epoch: 15, batch: 0 // loss: 0.303\n", "epoch: 15, batch: 100 // loss: 0.326\n", "epoch: 15, batch: 200 // loss: 0.487\n", "epoch: 15, batch: 300 // loss: 0.315\n", "epoch: 15, batch: 400 // loss: 0.184\n", "epoch: 15, batch: 500 // loss: 0.405\n", "epoch: 15, batch: 600 // loss: 0.484\n", "epoch: 15, batch: 700 // loss: 0.250\n", "epoch: 15, batch: 800 // loss: 0.284\n", "epoch: 15, batch: 900 // loss: 0.109\n", "epoch: 15, batch: 1000 // loss: 0.593\n", "epoch: 15, batch: 1100 // loss: 0.139\n", "epoch: 15, batch: 1200 // loss: 0.209\n", "\n", "epoch: 16, batch: 0 // loss: 0.297\n", "epoch: 16, batch: 100 // loss: 0.325\n", "epoch: 16, batch: 200 // loss: 0.476\n", "epoch: 16, batch: 300 // loss: 0.316\n", "epoch: 16, batch: 400 // loss: 0.180\n", "epoch: 16, batch: 500 // loss: 0.406\n", "epoch: 16, batch: 600 // loss: 0.477\n", "epoch: 16, batch: 700 // loss: 0.247\n", "epoch: 16, batch: 800 // loss: 0.287\n", "epoch: 16, batch: 900 // loss: 0.109\n", "epoch: 16, batch: 1000 // loss: 0.590\n", "epoch: 16, batch: 1100 // loss: 0.135\n", "epoch: 16, batch: 1200 // loss: 0.200\n", "\n", "epoch: 17, batch: 0 // loss: 0.294\n", "epoch: 17, batch: 100 // loss: 0.323\n", "epoch: 17, batch: 200 // loss: 0.467\n", "epoch: 17, batch: 300 // loss: 0.314\n", "epoch: 17, batch: 400 // loss: 0.176\n", "epoch: 17, batch: 500 // loss: 0.406\n", "epoch: 17, batch: 600 // loss: 0.471\n", "epoch: 17, batch: 700 // loss: 0.247\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 17, batch: 800 // loss: 0.289\n", "epoch: 17, batch: 900 // loss: 0.106\n", "epoch: 17, batch: 1000 // loss: 0.585\n", "epoch: 17, batch: 1100 // loss: 0.135\n", "epoch: 17, batch: 1200 // loss: 0.198\n", "\n", "epoch: 18, batch: 0 // loss: 0.291\n", "epoch: 18, batch: 100 // loss: 0.325\n", "epoch: 18, batch: 200 // loss: 0.458\n", "epoch: 18, batch: 300 // loss: 0.313\n", "epoch: 18, batch: 400 // loss: 0.173\n", "epoch: 18, batch: 500 // loss: 0.412\n", "epoch: 18, batch: 600 // loss: 0.465\n", "epoch: 18, batch: 700 // loss: 0.245\n", "epoch: 18, batch: 800 // loss: 0.287\n", "epoch: 18, batch: 900 // loss: 0.102\n", "epoch: 18, batch: 1000 // loss: 0.576\n", "epoch: 18, batch: 1100 // loss: 0.133\n", "epoch: 18, batch: 1200 // loss: 0.193\n", "\n", "epoch: 19, batch: 0 // loss: 0.287\n", "epoch: 19, batch: 100 // loss: 0.324\n", "epoch: 19, batch: 200 // loss: 0.450\n", "epoch: 19, batch: 300 // loss: 0.312\n", "epoch: 19, batch: 400 // loss: 0.169\n", "epoch: 19, batch: 500 // loss: 0.418\n", "epoch: 19, batch: 600 // loss: 0.459\n", "epoch: 19, batch: 700 // loss: 0.241\n", "epoch: 19, batch: 800 // loss: 0.281\n", "epoch: 19, batch: 900 // loss: 0.099\n", "epoch: 19, batch: 1000 // loss: 0.569\n", "epoch: 19, batch: 1100 // loss: 0.133\n", "epoch: 19, batch: 1200 // loss: 0.187\n", "\n", "epoch: 20, batch: 0 // loss: 0.287\n", "epoch: 20, batch: 100 // loss: 0.325\n", "epoch: 20, batch: 200 // loss: 0.440\n", "epoch: 20, batch: 300 // loss: 0.309\n", "epoch: 20, batch: 400 // loss: 0.165\n", "epoch: 20, batch: 500 // loss: 0.416\n", "epoch: 20, batch: 600 // loss: 0.453\n", "epoch: 20, batch: 700 // loss: 0.238\n", "epoch: 20, batch: 800 // loss: 0.286\n", "epoch: 20, batch: 900 // loss: 0.096\n", "epoch: 20, batch: 1000 // loss: 0.568\n", "epoch: 20, batch: 1100 // loss: 0.131\n", "epoch: 20, batch: 1200 // loss: 0.185\n", "\n", "epoch: 21, batch: 0 // loss: 0.285\n", "epoch: 21, batch: 100 // loss: 0.324\n", "epoch: 21, batch: 200 // loss: 0.434\n", "epoch: 21, batch: 300 // loss: 0.306\n", "epoch: 21, batch: 400 // loss: 0.162\n", "epoch: 21, batch: 500 // loss: 0.418\n", "epoch: 21, batch: 600 // loss: 0.445\n", "epoch: 21, batch: 700 // loss: 0.237\n", "epoch: 21, batch: 800 // loss: 0.286\n", "epoch: 21, batch: 900 // loss: 0.096\n", "epoch: 21, batch: 1000 // loss: 0.566\n", "epoch: 21, batch: 1100 // loss: 0.130\n", "epoch: 21, batch: 1200 // loss: 0.181\n", "\n", "epoch: 22, batch: 0 // loss: 0.281\n", "epoch: 22, batch: 100 // loss: 0.320\n", "epoch: 22, batch: 200 // loss: 0.422\n", "epoch: 22, batch: 300 // loss: 0.302\n", "epoch: 22, batch: 400 // loss: 0.160\n", "epoch: 22, batch: 500 // loss: 0.420\n", "epoch: 22, batch: 600 // loss: 0.439\n", "epoch: 22, batch: 700 // loss: 0.235\n", "epoch: 22, batch: 800 // loss: 0.294\n", "epoch: 22, batch: 900 // loss: 0.092\n", "epoch: 22, batch: 1000 // loss: 0.565\n", "epoch: 22, batch: 1100 // loss: 0.128\n", "epoch: 22, batch: 1200 // loss: 0.176\n", "\n", "epoch: 23, batch: 0 // loss: 0.285\n", "epoch: 23, batch: 100 // loss: 0.318\n", "epoch: 23, batch: 200 // loss: 0.424\n", "epoch: 23, batch: 300 // loss: 0.298\n", "epoch: 23, batch: 400 // loss: 0.157\n", "epoch: 23, batch: 500 // loss: 0.423\n", "epoch: 23, batch: 600 // loss: 0.436\n", "epoch: 23, batch: 700 // loss: 0.239\n", "epoch: 23, batch: 800 // loss: 0.292\n", "epoch: 23, batch: 900 // loss: 0.091\n", "epoch: 23, batch: 1000 // loss: 0.562\n", "epoch: 23, batch: 1100 // loss: 0.122\n", "epoch: 23, batch: 1200 // loss: 0.172\n", "\n", "epoch: 24, batch: 0 // loss: 0.285\n", "epoch: 24, batch: 100 // loss: 0.310\n", "epoch: 24, batch: 200 // loss: 0.418\n", "epoch: 24, batch: 300 // loss: 0.299\n", "epoch: 24, batch: 400 // loss: 0.154\n", "epoch: 24, batch: 500 // loss: 0.425\n", "epoch: 24, batch: 600 // loss: 0.431\n", "epoch: 24, batch: 700 // loss: 0.228\n", "epoch: 24, batch: 800 // loss: 0.309\n", "epoch: 24, batch: 900 // loss: 0.088\n", "epoch: 24, batch: 1000 // loss: 0.561\n", "epoch: 24, batch: 1100 // loss: 0.121\n", "epoch: 24, batch: 1200 // loss: 0.170\n", "\n", "epoch: 25, batch: 0 // loss: 0.283\n", "epoch: 25, batch: 100 // loss: 0.309\n", "epoch: 25, batch: 200 // loss: 0.409\n", "epoch: 25, batch: 300 // loss: 0.296\n", "epoch: 25, batch: 400 // loss: 0.151\n", "epoch: 25, batch: 500 // loss: 0.425\n", "epoch: 25, batch: 600 // loss: 0.427\n", "epoch: 25, batch: 700 // loss: 0.220\n", "epoch: 25, batch: 800 // loss: 0.311\n", "epoch: 25, batch: 900 // loss: 0.085\n", "epoch: 25, batch: 1000 // loss: 0.559\n", "epoch: 25, batch: 1100 // loss: 0.121\n", "epoch: 25, batch: 1200 // loss: 0.169\n", "\n", "epoch: 26, batch: 0 // loss: 0.286\n", "epoch: 26, batch: 100 // loss: 0.309\n", "epoch: 26, batch: 200 // loss: 0.401\n", "epoch: 26, batch: 300 // loss: 0.291\n", "epoch: 26, batch: 400 // loss: 0.149\n", "epoch: 26, batch: 500 // loss: 0.428\n", "epoch: 26, batch: 600 // loss: 0.423\n", "epoch: 26, batch: 700 // loss: 0.236\n", "epoch: 26, batch: 800 // loss: 0.310\n", "epoch: 26, batch: 900 // loss: 0.084\n", "epoch: 26, batch: 1000 // loss: 0.558\n", "epoch: 26, batch: 1100 // loss: 0.119\n", "epoch: 26, batch: 1200 // loss: 0.166\n", "\n", "epoch: 27, batch: 0 // loss: 0.282\n", "epoch: 27, batch: 100 // loss: 0.310\n", "epoch: 27, batch: 200 // loss: 0.394\n", "epoch: 27, batch: 300 // loss: 0.293\n", "epoch: 27, batch: 400 // loss: 0.146\n", "epoch: 27, batch: 500 // loss: 0.428\n", "epoch: 27, batch: 600 // loss: 0.420\n", "epoch: 27, batch: 700 // loss: 0.242\n", "epoch: 27, batch: 800 // loss: 0.312\n", "epoch: 27, batch: 900 // loss: 0.083\n", "epoch: 27, batch: 1000 // loss: 0.558\n", "epoch: 27, batch: 1100 // loss: 0.118\n", "epoch: 27, batch: 1200 // loss: 0.163\n", "\n", "epoch: 28, batch: 0 // loss: 0.285\n", "epoch: 28, batch: 100 // loss: 0.310\n", "epoch: 28, batch: 200 // loss: 0.389\n", "epoch: 28, batch: 300 // loss: 0.287\n", "epoch: 28, batch: 400 // loss: 0.144\n", "epoch: 28, batch: 500 // loss: 0.429\n", "epoch: 28, batch: 600 // loss: 0.419\n", "epoch: 28, batch: 700 // loss: 0.242\n", "epoch: 28, batch: 800 // loss: 0.310\n", "epoch: 28, batch: 900 // loss: 0.081\n", "epoch: 28, batch: 1000 // loss: 0.551\n", "epoch: 28, batch: 1100 // loss: 0.115\n", "epoch: 28, batch: 1200 // loss: 0.160\n", "\n", "epoch: 29, batch: 0 // loss: 0.282\n", "epoch: 29, batch: 100 // loss: 0.298\n", "epoch: 29, batch: 200 // loss: 0.400\n", "epoch: 29, batch: 300 // loss: 0.283\n", "epoch: 29, batch: 400 // loss: 0.143\n", "epoch: 29, batch: 500 // loss: 0.427\n", "epoch: 29, batch: 600 // loss: 0.420\n", "epoch: 29, batch: 700 // loss: 0.248\n", "epoch: 29, batch: 800 // loss: 0.311\n", "epoch: 29, batch: 900 // loss: 0.080\n", "epoch: 29, batch: 1000 // loss: 0.549\n", "epoch: 29, batch: 1100 // loss: 0.113\n", "epoch: 29, batch: 1200 // loss: 0.157\n", "\n", "epoch: 30, batch: 0 // loss: 0.283\n", "epoch: 30, batch: 100 // loss: 0.294\n", "epoch: 30, batch: 200 // loss: 0.406\n", "epoch: 30, batch: 300 // loss: 0.281\n", "epoch: 30, batch: 400 // loss: 0.141\n", "epoch: 30, batch: 500 // loss: 0.421\n", "epoch: 30, batch: 600 // loss: 0.419\n", "epoch: 30, batch: 700 // loss: 0.250\n", "epoch: 30, batch: 800 // loss: 0.312\n", "epoch: 30, batch: 900 // loss: 0.080\n", "epoch: 30, batch: 1000 // loss: 0.548\n", "epoch: 30, batch: 1100 // loss: 0.114\n", "epoch: 30, batch: 1200 // loss: 0.154\n", "\n", "epoch: 31, batch: 0 // loss: 0.279\n", "epoch: 31, batch: 100 // loss: 0.290\n", "epoch: 31, batch: 200 // loss: 0.401\n", "epoch: 31, batch: 300 // loss: 0.278\n", "epoch: 31, batch: 400 // loss: 0.140\n", "epoch: 31, batch: 500 // loss: 0.418\n", "epoch: 31, batch: 600 // loss: 0.419\n", "epoch: 31, batch: 700 // loss: 0.251\n", "epoch: 31, batch: 800 // loss: 0.313\n", "epoch: 31, batch: 900 // loss: 0.079\n", "epoch: 31, batch: 1000 // loss: 0.544\n", "epoch: 31, batch: 1100 // loss: 0.114\n", "epoch: 31, batch: 1200 // loss: 0.154\n", "\n", "epoch: 32, batch: 0 // loss: 0.281\n", "epoch: 32, batch: 100 // loss: 0.284\n", "epoch: 32, batch: 200 // loss: 0.404\n", "epoch: 32, batch: 300 // loss: 0.277\n", "epoch: 32, batch: 400 // loss: 0.138\n", "epoch: 32, batch: 500 // loss: 0.424\n", "epoch: 32, batch: 600 // loss: 0.419\n", "epoch: 32, batch: 700 // loss: 0.254\n", "epoch: 32, batch: 800 // loss: 0.309\n", "epoch: 32, batch: 900 // loss: 0.077\n", "epoch: 32, batch: 1000 // loss: 0.547\n", "epoch: 32, batch: 1100 // loss: 0.114\n", "epoch: 32, batch: 1200 // loss: 0.151\n", "\n", "epoch: 33, batch: 0 // loss: 0.281\n", "epoch: 33, batch: 100 // loss: 0.287\n", "epoch: 33, batch: 200 // loss: 0.402\n", "epoch: 33, batch: 300 // loss: 0.279\n", "epoch: 33, batch: 400 // loss: 0.137\n", "epoch: 33, batch: 500 // loss: 0.424\n", "epoch: 33, batch: 600 // loss: 0.416\n", "epoch: 33, batch: 700 // loss: 0.254\n", "epoch: 33, batch: 800 // loss: 0.313\n", "epoch: 33, batch: 900 // loss: 0.077\n", "epoch: 33, batch: 1000 // loss: 0.543\n", "epoch: 33, batch: 1100 // loss: 0.116\n", "epoch: 33, batch: 1200 // loss: 0.149\n", "\n", "epoch: 34, batch: 0 // loss: 0.286\n", "epoch: 34, batch: 100 // loss: 0.278\n", "epoch: 34, batch: 200 // loss: 0.394\n", "epoch: 34, batch: 300 // loss: 0.277\n", "epoch: 34, batch: 400 // loss: 0.137\n", "epoch: 34, batch: 500 // loss: 0.429\n", "epoch: 34, batch: 600 // loss: 0.413\n", "epoch: 34, batch: 700 // loss: 0.257\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 34, batch: 800 // loss: 0.309\n", "epoch: 34, batch: 900 // loss: 0.075\n", "epoch: 34, batch: 1000 // loss: 0.539\n", "epoch: 34, batch: 1100 // loss: 0.116\n", "epoch: 34, batch: 1200 // loss: 0.147\n", "\n", "epoch: 35, batch: 0 // loss: 0.279\n", "epoch: 35, batch: 100 // loss: 0.279\n", "epoch: 35, batch: 200 // loss: 0.397\n", "epoch: 35, batch: 300 // loss: 0.277\n", "epoch: 35, batch: 400 // loss: 0.137\n", "epoch: 35, batch: 500 // loss: 0.426\n", "epoch: 35, batch: 600 // loss: 0.409\n", "epoch: 35, batch: 700 // loss: 0.258\n", "epoch: 35, batch: 800 // loss: 0.316\n", "epoch: 35, batch: 900 // loss: 0.075\n", "epoch: 35, batch: 1000 // loss: 0.541\n", "epoch: 35, batch: 1100 // loss: 0.115\n", "epoch: 35, batch: 1200 // loss: 0.145\n", "\n", "epoch: 36, batch: 0 // loss: 0.276\n", "epoch: 36, batch: 100 // loss: 0.274\n", "epoch: 36, batch: 200 // loss: 0.400\n", "epoch: 36, batch: 300 // loss: 0.277\n", "epoch: 36, batch: 400 // loss: 0.136\n", "epoch: 36, batch: 500 // loss: 0.434\n", "epoch: 36, batch: 600 // loss: 0.406\n", "epoch: 36, batch: 700 // loss: 0.259\n", "epoch: 36, batch: 800 // loss: 0.315\n", "epoch: 36, batch: 900 // loss: 0.073\n", "epoch: 36, batch: 1000 // loss: 0.540\n", "epoch: 36, batch: 1100 // loss: 0.115\n", "epoch: 36, batch: 1200 // loss: 0.143\n", "\n", "epoch: 37, batch: 0 // loss: 0.272\n", "epoch: 37, batch: 100 // loss: 0.269\n", "epoch: 37, batch: 200 // loss: 0.386\n", "epoch: 37, batch: 300 // loss: 0.271\n", "epoch: 37, batch: 400 // loss: 0.138\n", "epoch: 37, batch: 500 // loss: 0.432\n", "epoch: 37, batch: 600 // loss: 0.404\n", "epoch: 37, batch: 700 // loss: 0.265\n", "epoch: 37, batch: 800 // loss: 0.309\n", "epoch: 37, batch: 900 // loss: 0.074\n", "epoch: 37, batch: 1000 // loss: 0.534\n", "epoch: 37, batch: 1100 // loss: 0.116\n", "epoch: 37, batch: 1200 // loss: 0.143\n", "\n", "epoch: 38, batch: 0 // loss: 0.272\n", "epoch: 38, batch: 100 // loss: 0.264\n", "epoch: 38, batch: 200 // loss: 0.391\n", "epoch: 38, batch: 300 // loss: 0.269\n", "epoch: 38, batch: 400 // loss: 0.136\n", "epoch: 38, batch: 500 // loss: 0.439\n", "epoch: 38, batch: 600 // loss: 0.402\n", "epoch: 38, batch: 700 // loss: 0.266\n", "epoch: 38, batch: 800 // loss: 0.304\n", "epoch: 38, batch: 900 // loss: 0.072\n", "epoch: 38, batch: 1000 // loss: 0.531\n", "epoch: 38, batch: 1100 // loss: 0.117\n", "epoch: 38, batch: 1200 // loss: 0.140\n", "\n", "epoch: 39, batch: 0 // loss: 0.273\n", "epoch: 39, batch: 100 // loss: 0.260\n", "epoch: 39, batch: 200 // loss: 0.385\n", "epoch: 39, batch: 300 // loss: 0.267\n", "epoch: 39, batch: 400 // loss: 0.137\n", "epoch: 39, batch: 500 // loss: 0.435\n", "epoch: 39, batch: 600 // loss: 0.404\n", "epoch: 39, batch: 700 // loss: 0.269\n", "epoch: 39, batch: 800 // loss: 0.303\n", "epoch: 39, batch: 900 // loss: 0.072\n", "epoch: 39, batch: 1000 // loss: 0.525\n", "epoch: 39, batch: 1100 // loss: 0.118\n", "epoch: 39, batch: 1200 // loss: 0.139\n", "\n", "epoch: 40, batch: 0 // loss: 0.268\n", "epoch: 40, batch: 100 // loss: 0.256\n", "epoch: 40, batch: 200 // loss: 0.383\n", "epoch: 40, batch: 300 // loss: 0.267\n", "epoch: 40, batch: 400 // loss: 0.136\n", "epoch: 40, batch: 500 // loss: 0.433\n", "epoch: 40, batch: 600 // loss: 0.400\n", "epoch: 40, batch: 700 // loss: 0.277\n", "epoch: 40, batch: 800 // loss: 0.299\n", "epoch: 40, batch: 900 // loss: 0.073\n", "epoch: 40, batch: 1000 // loss: 0.524\n", "epoch: 40, batch: 1100 // loss: 0.118\n", "epoch: 40, batch: 1200 // loss: 0.139\n", "\n", "epoch: 41, batch: 0 // loss: 0.268\n", "epoch: 41, batch: 100 // loss: 0.255\n", "epoch: 41, batch: 200 // loss: 0.390\n", "epoch: 41, batch: 300 // loss: 0.267\n", "epoch: 41, batch: 400 // loss: 0.138\n", "epoch: 41, batch: 500 // loss: 0.434\n", "epoch: 41, batch: 600 // loss: 0.396\n", "epoch: 41, batch: 700 // loss: 0.277\n", "epoch: 41, batch: 800 // loss: 0.297\n", "epoch: 41, batch: 900 // loss: 0.070\n", "epoch: 41, batch: 1000 // loss: 0.524\n", "epoch: 41, batch: 1100 // loss: 0.120\n", "epoch: 41, batch: 1200 // loss: 0.137\n", "\n", "epoch: 42, batch: 0 // loss: 0.264\n", "epoch: 42, batch: 100 // loss: 0.252\n", "epoch: 42, batch: 200 // loss: 0.388\n", "epoch: 42, batch: 300 // loss: 0.263\n", "epoch: 42, batch: 400 // loss: 0.139\n", "epoch: 42, batch: 500 // loss: 0.431\n", "epoch: 42, batch: 600 // loss: 0.400\n", "epoch: 42, batch: 700 // loss: 0.277\n", "epoch: 42, batch: 800 // loss: 0.294\n", "epoch: 42, batch: 900 // loss: 0.070\n", "epoch: 42, batch: 1000 // loss: 0.530\n", "epoch: 42, batch: 1100 // loss: 0.125\n", "epoch: 42, batch: 1200 // loss: 0.137\n", "\n", "epoch: 43, batch: 0 // loss: 0.259\n", "epoch: 43, batch: 100 // loss: 0.247\n", "epoch: 43, batch: 200 // loss: 0.382\n", "epoch: 43, batch: 300 // loss: 0.264\n", "epoch: 43, batch: 400 // loss: 0.138\n", "epoch: 43, batch: 500 // loss: 0.437\n", "epoch: 43, batch: 600 // loss: 0.403\n", "epoch: 43, batch: 700 // loss: 0.267\n", "epoch: 43, batch: 800 // loss: 0.301\n", "epoch: 43, batch: 900 // loss: 0.068\n", "epoch: 43, batch: 1000 // loss: 0.525\n", "epoch: 43, batch: 1100 // loss: 0.124\n", "epoch: 43, batch: 1200 // loss: 0.139\n", "\n", "epoch: 44, batch: 0 // loss: 0.258\n", "epoch: 44, batch: 100 // loss: 0.245\n", "epoch: 44, batch: 200 // loss: 0.384\n", "epoch: 44, batch: 300 // loss: 0.261\n", "epoch: 44, batch: 400 // loss: 0.138\n", "epoch: 44, batch: 500 // loss: 0.434\n", "epoch: 44, batch: 600 // loss: 0.404\n", "epoch: 44, batch: 700 // loss: 0.267\n", "epoch: 44, batch: 800 // loss: 0.292\n", "epoch: 44, batch: 900 // loss: 0.072\n", "epoch: 44, batch: 1000 // loss: 0.528\n", "epoch: 44, batch: 1100 // loss: 0.126\n", "epoch: 44, batch: 1200 // loss: 0.137\n", "\n", "epoch: 45, batch: 0 // loss: 0.254\n", "epoch: 45, batch: 100 // loss: 0.243\n", "epoch: 45, batch: 200 // loss: 0.371\n", "epoch: 45, batch: 300 // loss: 0.257\n", "epoch: 45, batch: 400 // loss: 0.137\n", "epoch: 45, batch: 500 // loss: 0.436\n", "epoch: 45, batch: 600 // loss: 0.404\n", "epoch: 45, batch: 700 // loss: 0.269\n", "epoch: 45, batch: 800 // loss: 0.286\n", "epoch: 45, batch: 900 // loss: 0.069\n", "epoch: 45, batch: 1000 // loss: 0.531\n", "epoch: 45, batch: 1100 // loss: 0.124\n", "epoch: 45, batch: 1200 // loss: 0.138\n", "\n", "epoch: 46, batch: 0 // loss: 0.248\n", "epoch: 46, batch: 100 // loss: 0.243\n", "epoch: 46, batch: 200 // loss: 0.372\n", "epoch: 46, batch: 300 // loss: 0.257\n", "epoch: 46, batch: 400 // loss: 0.137\n", "epoch: 46, batch: 500 // loss: 0.440\n", "epoch: 46, batch: 600 // loss: 0.406\n", "epoch: 46, batch: 700 // loss: 0.262\n", "epoch: 46, batch: 800 // loss: 0.285\n", "epoch: 46, batch: 900 // loss: 0.070\n", "epoch: 46, batch: 1000 // loss: 0.531\n", "epoch: 46, batch: 1100 // loss: 0.127\n", "epoch: 46, batch: 1200 // loss: 0.140\n", "\n", "epoch: 47, batch: 0 // loss: 0.247\n", "epoch: 47, batch: 100 // loss: 0.243\n", "epoch: 47, batch: 200 // loss: 0.366\n", "epoch: 47, batch: 300 // loss: 0.255\n", "epoch: 47, batch: 400 // loss: 0.137\n", "epoch: 47, batch: 500 // loss: 0.438\n", "epoch: 47, batch: 600 // loss: 0.407\n", "epoch: 47, batch: 700 // loss: 0.263\n", "epoch: 47, batch: 800 // loss: 0.284\n", "epoch: 47, batch: 900 // loss: 0.068\n", "epoch: 47, batch: 1000 // loss: 0.531\n", "epoch: 47, batch: 1100 // loss: 0.127\n", "epoch: 47, batch: 1200 // loss: 0.140\n", "\n", "epoch: 48, batch: 0 // loss: 0.243\n", "epoch: 48, batch: 100 // loss: 0.243\n", "epoch: 48, batch: 200 // loss: 0.361\n", "epoch: 48, batch: 300 // loss: 0.250\n", "epoch: 48, batch: 400 // loss: 0.136\n", "epoch: 48, batch: 500 // loss: 0.440\n", "epoch: 48, batch: 600 // loss: 0.410\n", "epoch: 48, batch: 700 // loss: 0.268\n", "epoch: 48, batch: 800 // loss: 0.279\n", "epoch: 48, batch: 900 // loss: 0.065\n", "epoch: 48, batch: 1000 // loss: 0.528\n", "epoch: 48, batch: 1100 // loss: 0.129\n", "epoch: 48, batch: 1200 // loss: 0.132\n", "\n", "epoch: 49, batch: 0 // loss: 0.239\n", "epoch: 49, batch: 100 // loss: 0.240\n", "epoch: 49, batch: 200 // loss: 0.361\n", "epoch: 49, batch: 300 // loss: 0.253\n", "epoch: 49, batch: 400 // loss: 0.135\n", "epoch: 49, batch: 500 // loss: 0.439\n", "epoch: 49, batch: 600 // loss: 0.411\n", "epoch: 49, batch: 700 // loss: 0.271\n", "epoch: 49, batch: 800 // loss: 0.271\n", "epoch: 49, batch: 900 // loss: 0.066\n", "epoch: 49, batch: 1000 // loss: 0.527\n", "epoch: 49, batch: 1100 // loss: 0.130\n", "epoch: 49, batch: 1200 // loss: 0.132\n", "\n", "epoch: 50, batch: 0 // loss: 0.231\n", "epoch: 50, batch: 100 // loss: 0.237\n", "epoch: 50, batch: 200 // loss: 0.363\n", "epoch: 50, batch: 300 // loss: 0.245\n", "epoch: 50, batch: 400 // loss: 0.135\n", "epoch: 50, batch: 500 // loss: 0.444\n", "epoch: 50, batch: 600 // loss: 0.409\n", "epoch: 50, batch: 700 // loss: 0.269\n", "epoch: 50, batch: 800 // loss: 0.269\n", "epoch: 50, batch: 900 // loss: 0.065\n", "epoch: 50, batch: 1000 // loss: 0.525\n", "epoch: 50, batch: 1100 // loss: 0.130\n", "epoch: 50, batch: 1200 // loss: 0.136\n", "\n", "epoch: 51, batch: 0 // loss: 0.231\n", "epoch: 51, batch: 100 // loss: 0.233\n", "epoch: 51, batch: 200 // loss: 0.350\n", "epoch: 51, batch: 300 // loss: 0.243\n", "epoch: 51, batch: 400 // loss: 0.135\n", "epoch: 51, batch: 500 // loss: 0.444\n", "epoch: 51, batch: 600 // loss: 0.408\n", "epoch: 51, batch: 700 // loss: 0.266\n", "epoch: 51, batch: 800 // loss: 0.269\n", "epoch: 51, batch: 900 // loss: 0.064\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 51, batch: 1000 // loss: 0.524\n", "epoch: 51, batch: 1100 // loss: 0.131\n", "epoch: 51, batch: 1200 // loss: 0.130\n", "\n", "epoch: 52, batch: 0 // loss: 0.225\n", "epoch: 52, batch: 100 // loss: 0.232\n", "epoch: 52, batch: 200 // loss: 0.349\n", "epoch: 52, batch: 300 // loss: 0.243\n", "epoch: 52, batch: 400 // loss: 0.135\n", "epoch: 52, batch: 500 // loss: 0.443\n", "epoch: 52, batch: 600 // loss: 0.404\n", "epoch: 52, batch: 700 // loss: 0.268\n", "epoch: 52, batch: 800 // loss: 0.264\n", "epoch: 52, batch: 900 // loss: 0.064\n", "epoch: 52, batch: 1000 // loss: 0.522\n", "epoch: 52, batch: 1100 // loss: 0.133\n", "epoch: 52, batch: 1200 // loss: 0.137\n", "\n", "epoch: 53, batch: 0 // loss: 0.224\n", "epoch: 53, batch: 100 // loss: 0.225\n", "epoch: 53, batch: 200 // loss: 0.341\n", "epoch: 53, batch: 300 // loss: 0.236\n", "epoch: 53, batch: 400 // loss: 0.135\n", "epoch: 53, batch: 500 // loss: 0.448\n", "epoch: 53, batch: 600 // loss: 0.403\n", "epoch: 53, batch: 700 // loss: 0.266\n", "epoch: 53, batch: 800 // loss: 0.259\n", "epoch: 53, batch: 900 // loss: 0.064\n", "epoch: 53, batch: 1000 // loss: 0.526\n", "epoch: 53, batch: 1100 // loss: 0.133\n", "epoch: 53, batch: 1200 // loss: 0.134\n", "\n", "epoch: 54, batch: 0 // loss: 0.220\n", "epoch: 54, batch: 100 // loss: 0.222\n", "epoch: 54, batch: 200 // loss: 0.352\n", "epoch: 54, batch: 300 // loss: 0.241\n", "epoch: 54, batch: 400 // loss: 0.131\n", "epoch: 54, batch: 500 // loss: 0.440\n", "epoch: 54, batch: 600 // loss: 0.401\n", "epoch: 54, batch: 700 // loss: 0.273\n", "epoch: 54, batch: 800 // loss: 0.257\n", "epoch: 54, batch: 900 // loss: 0.063\n", "epoch: 54, batch: 1000 // loss: 0.527\n", "epoch: 54, batch: 1100 // loss: 0.134\n", "epoch: 54, batch: 1200 // loss: 0.134\n", "\n", "epoch: 55, batch: 0 // loss: 0.220\n", "epoch: 55, batch: 100 // loss: 0.226\n", "epoch: 55, batch: 200 // loss: 0.347\n", "epoch: 55, batch: 300 // loss: 0.240\n", "epoch: 55, batch: 400 // loss: 0.131\n", "epoch: 55, batch: 500 // loss: 0.451\n", "epoch: 55, batch: 600 // loss: 0.402\n", "epoch: 55, batch: 700 // loss: 0.268\n", "epoch: 55, batch: 800 // loss: 0.256\n", "epoch: 55, batch: 900 // loss: 0.064\n", "epoch: 55, batch: 1000 // loss: 0.526\n", "epoch: 55, batch: 1100 // loss: 0.131\n", "epoch: 55, batch: 1200 // loss: 0.134\n", "\n", "epoch: 56, batch: 0 // loss: 0.218\n", "epoch: 56, batch: 100 // loss: 0.220\n", "epoch: 56, batch: 200 // loss: 0.343\n", "epoch: 56, batch: 300 // loss: 0.234\n", "epoch: 56, batch: 400 // loss: 0.132\n", "epoch: 56, batch: 500 // loss: 0.451\n", "epoch: 56, batch: 600 // loss: 0.400\n", "epoch: 56, batch: 700 // loss: 0.260\n", "epoch: 56, batch: 800 // loss: 0.250\n", "epoch: 56, batch: 900 // loss: 0.063\n", "epoch: 56, batch: 1000 // loss: 0.528\n", "epoch: 56, batch: 1100 // loss: 0.135\n", "epoch: 56, batch: 1200 // loss: 0.133\n", "\n", "epoch: 57, batch: 0 // loss: 0.217\n", "epoch: 57, batch: 100 // loss: 0.219\n", "epoch: 57, batch: 200 // loss: 0.343\n", "epoch: 57, batch: 300 // loss: 0.235\n", "epoch: 57, batch: 400 // loss: 0.131\n", "epoch: 57, batch: 500 // loss: 0.443\n", "epoch: 57, batch: 600 // loss: 0.396\n", "epoch: 57, batch: 700 // loss: 0.261\n", "epoch: 57, batch: 800 // loss: 0.242\n", "epoch: 57, batch: 900 // loss: 0.063\n", "epoch: 57, batch: 1000 // loss: 0.524\n", "epoch: 57, batch: 1100 // loss: 0.134\n", "epoch: 57, batch: 1200 // loss: 0.130\n", "\n", "epoch: 58, batch: 0 // loss: 0.217\n", "epoch: 58, batch: 100 // loss: 0.220\n", "epoch: 58, batch: 200 // loss: 0.348\n", "epoch: 58, batch: 300 // loss: 0.233\n", "epoch: 58, batch: 400 // loss: 0.131\n", "epoch: 58, batch: 500 // loss: 0.446\n", "epoch: 58, batch: 600 // loss: 0.398\n", "epoch: 58, batch: 700 // loss: 0.258\n", "epoch: 58, batch: 800 // loss: 0.245\n", "epoch: 58, batch: 900 // loss: 0.063\n", "epoch: 58, batch: 1000 // loss: 0.525\n", "epoch: 58, batch: 1100 // loss: 0.133\n", "epoch: 58, batch: 1200 // loss: 0.130\n", "\n", "epoch: 59, batch: 0 // loss: 0.218\n", "epoch: 59, batch: 100 // loss: 0.215\n", "epoch: 59, batch: 200 // loss: 0.345\n", "epoch: 59, batch: 300 // loss: 0.233\n", "epoch: 59, batch: 400 // loss: 0.131\n", "epoch: 59, batch: 500 // loss: 0.445\n", "epoch: 59, batch: 600 // loss: 0.399\n", "epoch: 59, batch: 700 // loss: 0.256\n", "epoch: 59, batch: 800 // loss: 0.237\n", "epoch: 59, batch: 900 // loss: 0.064\n", "epoch: 59, batch: 1000 // loss: 0.529\n", "epoch: 59, batch: 1100 // loss: 0.142\n", "epoch: 59, batch: 1200 // loss: 0.127\n", "\n", "epoch: 60, batch: 0 // loss: 0.211\n", "epoch: 60, batch: 100 // loss: 0.217\n", "epoch: 60, batch: 200 // loss: 0.335\n", "epoch: 60, batch: 300 // loss: 0.233\n", "epoch: 60, batch: 400 // loss: 0.130\n", "epoch: 60, batch: 500 // loss: 0.450\n", "epoch: 60, batch: 600 // loss: 0.397\n", "epoch: 60, batch: 700 // loss: 0.255\n", "epoch: 60, batch: 800 // loss: 0.235\n", "epoch: 60, batch: 900 // loss: 0.063\n", "epoch: 60, batch: 1000 // loss: 0.522\n", "epoch: 60, batch: 1100 // loss: 0.139\n", "epoch: 60, batch: 1200 // loss: 0.130\n", "\n", "epoch: 61, batch: 0 // loss: 0.208\n", "epoch: 61, batch: 100 // loss: 0.220\n", "epoch: 61, batch: 200 // loss: 0.329\n", "epoch: 61, batch: 300 // loss: 0.229\n", "epoch: 61, batch: 400 // loss: 0.132\n", "epoch: 61, batch: 500 // loss: 0.449\n", "epoch: 61, batch: 600 // loss: 0.394\n", "epoch: 61, batch: 700 // loss: 0.253\n", "epoch: 61, batch: 800 // loss: 0.229\n", "epoch: 61, batch: 900 // loss: 0.062\n", "epoch: 61, batch: 1000 // loss: 0.523\n", "epoch: 61, batch: 1100 // loss: 0.139\n", "epoch: 61, batch: 1200 // loss: 0.127\n", "\n", "epoch: 62, batch: 0 // loss: 0.204\n", "epoch: 62, batch: 100 // loss: 0.215\n", "epoch: 62, batch: 200 // loss: 0.331\n", "epoch: 62, batch: 300 // loss: 0.229\n", "epoch: 62, batch: 400 // loss: 0.131\n", "epoch: 62, batch: 500 // loss: 0.449\n", "epoch: 62, batch: 600 // loss: 0.391\n", "epoch: 62, batch: 700 // loss: 0.251\n", "epoch: 62, batch: 800 // loss: 0.226\n", "epoch: 62, batch: 900 // loss: 0.062\n", "epoch: 62, batch: 1000 // loss: 0.522\n", "epoch: 62, batch: 1100 // loss: 0.141\n", "epoch: 62, batch: 1200 // loss: 0.129\n", "\n", "epoch: 63, batch: 0 // loss: 0.207\n", "epoch: 63, batch: 100 // loss: 0.215\n", "epoch: 63, batch: 200 // loss: 0.323\n", "epoch: 63, batch: 300 // loss: 0.230\n", "epoch: 63, batch: 400 // loss: 0.130\n", "epoch: 63, batch: 500 // loss: 0.455\n", "epoch: 63, batch: 600 // loss: 0.391\n", "epoch: 63, batch: 700 // loss: 0.245\n", "epoch: 63, batch: 800 // loss: 0.224\n", "epoch: 63, batch: 900 // loss: 0.060\n", "epoch: 63, batch: 1000 // loss: 0.520\n", "epoch: 63, batch: 1100 // loss: 0.140\n", "epoch: 63, batch: 1200 // loss: 0.127\n", "\n", "epoch: 64, batch: 0 // loss: 0.206\n", "epoch: 64, batch: 100 // loss: 0.211\n", "epoch: 64, batch: 200 // loss: 0.316\n", "epoch: 64, batch: 300 // loss: 0.224\n", "epoch: 64, batch: 400 // loss: 0.132\n", "epoch: 64, batch: 500 // loss: 0.453\n", "epoch: 64, batch: 600 // loss: 0.388\n", "epoch: 64, batch: 700 // loss: 0.244\n", "epoch: 64, batch: 800 // loss: 0.219\n", "epoch: 64, batch: 900 // loss: 0.059\n", "epoch: 64, batch: 1000 // loss: 0.506\n", "epoch: 64, batch: 1100 // loss: 0.140\n", "epoch: 64, batch: 1200 // loss: 0.127\n", "\n", "epoch: 65, batch: 0 // loss: 0.202\n", "epoch: 65, batch: 100 // loss: 0.211\n", "epoch: 65, batch: 200 // loss: 0.308\n", "epoch: 65, batch: 300 // loss: 0.226\n", "epoch: 65, batch: 400 // loss: 0.131\n", "epoch: 65, batch: 500 // loss: 0.453\n", "epoch: 65, batch: 600 // loss: 0.385\n", "epoch: 65, batch: 700 // loss: 0.245\n", "epoch: 65, batch: 800 // loss: 0.219\n", "epoch: 65, batch: 900 // loss: 0.059\n", "epoch: 65, batch: 1000 // loss: 0.518\n", "epoch: 65, batch: 1100 // loss: 0.142\n", "epoch: 65, batch: 1200 // loss: 0.128\n", "\n", "epoch: 66, batch: 0 // loss: 0.203\n", "epoch: 66, batch: 100 // loss: 0.205\n", "epoch: 66, batch: 200 // loss: 0.305\n", "epoch: 66, batch: 300 // loss: 0.226\n", "epoch: 66, batch: 400 // loss: 0.130\n", "epoch: 66, batch: 500 // loss: 0.443\n", "epoch: 66, batch: 600 // loss: 0.383\n", "epoch: 66, batch: 700 // loss: 0.242\n", "epoch: 66, batch: 800 // loss: 0.215\n", "epoch: 66, batch: 900 // loss: 0.058\n", "epoch: 66, batch: 1000 // loss: 0.509\n", "epoch: 66, batch: 1100 // loss: 0.140\n", "epoch: 66, batch: 1200 // loss: 0.130\n", "\n", "epoch: 67, batch: 0 // loss: 0.201\n", "epoch: 67, batch: 100 // loss: 0.210\n", "epoch: 67, batch: 200 // loss: 0.303\n", "epoch: 67, batch: 300 // loss: 0.223\n", "epoch: 67, batch: 400 // loss: 0.129\n", "epoch: 67, batch: 500 // loss: 0.439\n", "epoch: 67, batch: 600 // loss: 0.379\n", "epoch: 67, batch: 700 // loss: 0.237\n", "epoch: 67, batch: 800 // loss: 0.207\n", "epoch: 67, batch: 900 // loss: 0.057\n", "epoch: 67, batch: 1000 // loss: 0.505\n", "epoch: 67, batch: 1100 // loss: 0.140\n", "epoch: 67, batch: 1200 // loss: 0.125\n", "\n", "epoch: 68, batch: 0 // loss: 0.202\n", "epoch: 68, batch: 100 // loss: 0.210\n", "epoch: 68, batch: 200 // loss: 0.297\n", "epoch: 68, batch: 300 // loss: 0.218\n", "epoch: 68, batch: 400 // loss: 0.130\n", "epoch: 68, batch: 500 // loss: 0.439\n", "epoch: 68, batch: 600 // loss: 0.378\n", "epoch: 68, batch: 700 // loss: 0.245\n", "epoch: 68, batch: 800 // loss: 0.208\n", "epoch: 68, batch: 900 // loss: 0.058\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 68, batch: 1000 // loss: 0.504\n", "epoch: 68, batch: 1100 // loss: 0.140\n", "epoch: 68, batch: 1200 // loss: 0.126\n", "\n", "epoch: 69, batch: 0 // loss: 0.197\n", "epoch: 69, batch: 100 // loss: 0.205\n", "epoch: 69, batch: 200 // loss: 0.295\n", "epoch: 69, batch: 300 // loss: 0.221\n", "epoch: 69, batch: 400 // loss: 0.133\n", "epoch: 69, batch: 500 // loss: 0.441\n", "epoch: 69, batch: 600 // loss: 0.377\n", "epoch: 69, batch: 700 // loss: 0.235\n", "epoch: 69, batch: 800 // loss: 0.202\n", "epoch: 69, batch: 900 // loss: 0.057\n", "epoch: 69, batch: 1000 // loss: 0.499\n", "epoch: 69, batch: 1100 // loss: 0.140\n", "epoch: 69, batch: 1200 // loss: 0.127\n", "\n", "epoch: 70, batch: 0 // loss: 0.199\n", "epoch: 70, batch: 100 // loss: 0.204\n", "epoch: 70, batch: 200 // loss: 0.289\n", "epoch: 70, batch: 300 // loss: 0.228\n", "epoch: 70, batch: 400 // loss: 0.133\n", "epoch: 70, batch: 500 // loss: 0.440\n", "epoch: 70, batch: 600 // loss: 0.372\n", "epoch: 70, batch: 700 // loss: 0.236\n", "epoch: 70, batch: 800 // loss: 0.205\n", "epoch: 70, batch: 900 // loss: 0.057\n", "epoch: 70, batch: 1000 // loss: 0.507\n", "epoch: 70, batch: 1100 // loss: 0.137\n", "epoch: 70, batch: 1200 // loss: 0.127\n", "\n", "epoch: 71, batch: 0 // loss: 0.198\n", "epoch: 71, batch: 100 // loss: 0.199\n", "epoch: 71, batch: 200 // loss: 0.278\n", "epoch: 71, batch: 300 // loss: 0.218\n", "epoch: 71, batch: 400 // loss: 0.133\n", "epoch: 71, batch: 500 // loss: 0.441\n", "epoch: 71, batch: 600 // loss: 0.370\n", "epoch: 71, batch: 700 // loss: 0.238\n", "epoch: 71, batch: 800 // loss: 0.204\n", "epoch: 71, batch: 900 // loss: 0.056\n", "epoch: 71, batch: 1000 // loss: 0.511\n", "epoch: 71, batch: 1100 // loss: 0.137\n", "epoch: 71, batch: 1200 // loss: 0.123\n", "\n", "epoch: 72, batch: 0 // loss: 0.197\n", "epoch: 72, batch: 100 // loss: 0.197\n", "epoch: 72, batch: 200 // loss: 0.274\n", "epoch: 72, batch: 300 // loss: 0.215\n", "epoch: 72, batch: 400 // loss: 0.133\n", "epoch: 72, batch: 500 // loss: 0.426\n", "epoch: 72, batch: 600 // loss: 0.366\n", "epoch: 72, batch: 700 // loss: 0.238\n", "epoch: 72, batch: 800 // loss: 0.196\n", "epoch: 72, batch: 900 // loss: 0.057\n", "epoch: 72, batch: 1000 // loss: 0.493\n", "epoch: 72, batch: 1100 // loss: 0.139\n", "epoch: 72, batch: 1200 // loss: 0.125\n", "\n", "epoch: 73, batch: 0 // loss: 0.198\n", "epoch: 73, batch: 100 // loss: 0.199\n", "epoch: 73, batch: 200 // loss: 0.273\n", "epoch: 73, batch: 300 // loss: 0.213\n", "epoch: 73, batch: 400 // loss: 0.133\n", "epoch: 73, batch: 500 // loss: 0.421\n", "epoch: 73, batch: 600 // loss: 0.365\n", "epoch: 73, batch: 700 // loss: 0.240\n", "epoch: 73, batch: 800 // loss: 0.196\n", "epoch: 73, batch: 900 // loss: 0.058\n", "epoch: 73, batch: 1000 // loss: 0.507\n", "epoch: 73, batch: 1100 // loss: 0.137\n", "epoch: 73, batch: 1200 // loss: 0.123\n", "\n", "epoch: 74, batch: 0 // loss: 0.197\n", "epoch: 74, batch: 100 // loss: 0.196\n", "epoch: 74, batch: 200 // loss: 0.262\n", "epoch: 74, batch: 300 // loss: 0.214\n", "epoch: 74, batch: 400 // loss: 0.131\n", "epoch: 74, batch: 500 // loss: 0.422\n", "epoch: 74, batch: 600 // loss: 0.359\n", "epoch: 74, batch: 700 // loss: 0.235\n", "epoch: 74, batch: 800 // loss: 0.197\n", "epoch: 74, batch: 900 // loss: 0.057\n", "epoch: 74, batch: 1000 // loss: 0.490\n", "epoch: 74, batch: 1100 // loss: 0.139\n", "epoch: 74, batch: 1200 // loss: 0.125\n", "\n", "epoch: 75, batch: 0 // loss: 0.194\n", "epoch: 75, batch: 100 // loss: 0.193\n", "epoch: 75, batch: 200 // loss: 0.263\n", "epoch: 75, batch: 300 // loss: 0.209\n", "epoch: 75, batch: 400 // loss: 0.132\n", "epoch: 75, batch: 500 // loss: 0.414\n", "epoch: 75, batch: 600 // loss: 0.362\n", "epoch: 75, batch: 700 // loss: 0.239\n", "epoch: 75, batch: 800 // loss: 0.197\n", "epoch: 75, batch: 900 // loss: 0.058\n", "epoch: 75, batch: 1000 // loss: 0.506\n", "epoch: 75, batch: 1100 // loss: 0.131\n", "epoch: 75, batch: 1200 // loss: 0.124\n", "\n", "epoch: 76, batch: 0 // loss: 0.189\n", "epoch: 76, batch: 100 // loss: 0.193\n", "epoch: 76, batch: 200 // loss: 0.262\n", "epoch: 76, batch: 300 // loss: 0.213\n", "epoch: 76, batch: 400 // loss: 0.132\n", "epoch: 76, batch: 500 // loss: 0.418\n", "epoch: 76, batch: 600 // loss: 0.359\n", "epoch: 76, batch: 700 // loss: 0.232\n", "epoch: 76, batch: 800 // loss: 0.193\n", "epoch: 76, batch: 900 // loss: 0.057\n", "epoch: 76, batch: 1000 // loss: 0.490\n", "epoch: 76, batch: 1100 // loss: 0.137\n", "epoch: 76, batch: 1200 // loss: 0.122\n", "\n", "epoch: 77, batch: 0 // loss: 0.192\n", "epoch: 77, batch: 100 // loss: 0.195\n", "epoch: 77, batch: 200 // loss: 0.259\n", "epoch: 77, batch: 300 // loss: 0.209\n", "epoch: 77, batch: 400 // loss: 0.136\n", "epoch: 77, batch: 500 // loss: 0.421\n", "epoch: 77, batch: 600 // loss: 0.355\n", "epoch: 77, batch: 700 // loss: 0.235\n", "epoch: 77, batch: 800 // loss: 0.194\n", "epoch: 77, batch: 900 // loss: 0.059\n", "epoch: 77, batch: 1000 // loss: 0.507\n", "epoch: 77, batch: 1100 // loss: 0.133\n", "epoch: 77, batch: 1200 // loss: 0.121\n", "\n", "epoch: 78, batch: 0 // loss: 0.186\n", "epoch: 78, batch: 100 // loss: 0.191\n", "epoch: 78, batch: 200 // loss: 0.258\n", "epoch: 78, batch: 300 // loss: 0.210\n", "epoch: 78, batch: 400 // loss: 0.135\n", "epoch: 78, batch: 500 // loss: 0.414\n", "epoch: 78, batch: 600 // loss: 0.354\n", "epoch: 78, batch: 700 // loss: 0.233\n", "epoch: 78, batch: 800 // loss: 0.190\n", "epoch: 78, batch: 900 // loss: 0.060\n", "epoch: 78, batch: 1000 // loss: 0.503\n", "epoch: 78, batch: 1100 // loss: 0.139\n", "epoch: 78, batch: 1200 // loss: 0.123\n", "\n", "epoch: 79, batch: 0 // loss: 0.187\n", "epoch: 79, batch: 100 // loss: 0.187\n", "epoch: 79, batch: 200 // loss: 0.252\n", "epoch: 79, batch: 300 // loss: 0.213\n", "epoch: 79, batch: 400 // loss: 0.136\n", "epoch: 79, batch: 500 // loss: 0.417\n", "epoch: 79, batch: 600 // loss: 0.351\n", "epoch: 79, batch: 700 // loss: 0.229\n", "epoch: 79, batch: 800 // loss: 0.191\n", "epoch: 79, batch: 900 // loss: 0.061\n", "epoch: 79, batch: 1000 // loss: 0.501\n", "epoch: 79, batch: 1100 // loss: 0.133\n", "epoch: 79, batch: 1200 // loss: 0.124\n", "\n", "epoch: 80, batch: 0 // loss: 0.191\n", "epoch: 80, batch: 100 // loss: 0.189\n", "epoch: 80, batch: 200 // loss: 0.245\n", "epoch: 80, batch: 300 // loss: 0.213\n", "epoch: 80, batch: 400 // loss: 0.137\n", "epoch: 80, batch: 500 // loss: 0.412\n", "epoch: 80, batch: 600 // loss: 0.348\n", "epoch: 80, batch: 700 // loss: 0.226\n", "epoch: 80, batch: 800 // loss: 0.189\n", "epoch: 80, batch: 900 // loss: 0.061\n", "epoch: 80, batch: 1000 // loss: 0.484\n", "epoch: 80, batch: 1100 // loss: 0.137\n", "epoch: 80, batch: 1200 // loss: 0.126\n", "\n", "epoch: 81, batch: 0 // loss: 0.189\n", "epoch: 81, batch: 100 // loss: 0.184\n", "epoch: 81, batch: 200 // loss: 0.251\n", "epoch: 81, batch: 300 // loss: 0.211\n", "epoch: 81, batch: 400 // loss: 0.135\n", "epoch: 81, batch: 500 // loss: 0.410\n", "epoch: 81, batch: 600 // loss: 0.341\n", "epoch: 81, batch: 700 // loss: 0.224\n", "epoch: 81, batch: 800 // loss: 0.181\n", "epoch: 81, batch: 900 // loss: 0.063\n", "epoch: 81, batch: 1000 // loss: 0.477\n", "epoch: 81, batch: 1100 // loss: 0.134\n", "epoch: 81, batch: 1200 // loss: 0.127\n", "\n", "epoch: 82, batch: 0 // loss: 0.185\n", "epoch: 82, batch: 100 // loss: 0.182\n", "epoch: 82, batch: 200 // loss: 0.249\n", "epoch: 82, batch: 300 // loss: 0.206\n", "epoch: 82, batch: 400 // loss: 0.137\n", "epoch: 82, batch: 500 // loss: 0.402\n", "epoch: 82, batch: 600 // loss: 0.342\n", "epoch: 82, batch: 700 // loss: 0.220\n", "epoch: 82, batch: 800 // loss: 0.182\n", "epoch: 82, batch: 900 // loss: 0.063\n", "epoch: 82, batch: 1000 // loss: 0.494\n", "epoch: 82, batch: 1100 // loss: 0.137\n", "epoch: 82, batch: 1200 // loss: 0.121\n", "\n", "epoch: 83, batch: 0 // loss: 0.189\n", "epoch: 83, batch: 100 // loss: 0.176\n", "epoch: 83, batch: 200 // loss: 0.249\n", "epoch: 83, batch: 300 // loss: 0.204\n", "epoch: 83, batch: 400 // loss: 0.137\n", "epoch: 83, batch: 500 // loss: 0.400\n", "epoch: 83, batch: 600 // loss: 0.332\n", "epoch: 83, batch: 700 // loss: 0.220\n", "epoch: 83, batch: 800 // loss: 0.177\n", "epoch: 83, batch: 900 // loss: 0.064\n", "epoch: 83, batch: 1000 // loss: 0.487\n", "epoch: 83, batch: 1100 // loss: 0.129\n", "epoch: 83, batch: 1200 // loss: 0.121\n", "\n", "epoch: 84, batch: 0 // loss: 0.188\n", "epoch: 84, batch: 100 // loss: 0.177\n", "epoch: 84, batch: 200 // loss: 0.239\n", "epoch: 84, batch: 300 // loss: 0.202\n", "epoch: 84, batch: 400 // loss: 0.137\n", "epoch: 84, batch: 500 // loss: 0.405\n", "epoch: 84, batch: 600 // loss: 0.330\n", "epoch: 84, batch: 700 // loss: 0.216\n", "epoch: 84, batch: 800 // loss: 0.176\n", "epoch: 84, batch: 900 // loss: 0.064\n", "epoch: 84, batch: 1000 // loss: 0.488\n", "epoch: 84, batch: 1100 // loss: 0.136\n", "epoch: 84, batch: 1200 // loss: 0.122\n", "\n", "epoch: 85, batch: 0 // loss: 0.185\n", "epoch: 85, batch: 100 // loss: 0.175\n", "epoch: 85, batch: 200 // loss: 0.241\n", "epoch: 85, batch: 300 // loss: 0.207\n", "epoch: 85, batch: 400 // loss: 0.139\n", "epoch: 85, batch: 500 // loss: 0.398\n", "epoch: 85, batch: 600 // loss: 0.325\n", "epoch: 85, batch: 700 // loss: 0.219\n", "epoch: 85, batch: 800 // loss: 0.170\n", "epoch: 85, batch: 900 // loss: 0.067\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 85, batch: 1000 // loss: 0.471\n", "epoch: 85, batch: 1100 // loss: 0.138\n", "epoch: 85, batch: 1200 // loss: 0.123\n", "\n", "epoch: 86, batch: 0 // loss: 0.181\n", "epoch: 86, batch: 100 // loss: 0.177\n", "epoch: 86, batch: 200 // loss: 0.237\n", "epoch: 86, batch: 300 // loss: 0.210\n", "epoch: 86, batch: 400 // loss: 0.141\n", "epoch: 86, batch: 500 // loss: 0.394\n", "epoch: 86, batch: 600 // loss: 0.321\n", "epoch: 86, batch: 700 // loss: 0.206\n", "epoch: 86, batch: 800 // loss: 0.165\n", "epoch: 86, batch: 900 // loss: 0.064\n", "epoch: 86, batch: 1000 // loss: 0.481\n", "epoch: 86, batch: 1100 // loss: 0.130\n", "epoch: 86, batch: 1200 // loss: 0.122\n", "\n", "epoch: 87, batch: 0 // loss: 0.184\n", "epoch: 87, batch: 100 // loss: 0.180\n", "epoch: 87, batch: 200 // loss: 0.240\n", "epoch: 87, batch: 300 // loss: 0.208\n", "epoch: 87, batch: 400 // loss: 0.140\n", "epoch: 87, batch: 500 // loss: 0.382\n", "epoch: 87, batch: 600 // loss: 0.323\n", "epoch: 87, batch: 700 // loss: 0.211\n", "epoch: 87, batch: 800 // loss: 0.164\n", "epoch: 87, batch: 900 // loss: 0.064\n", "epoch: 87, batch: 1000 // loss: 0.480\n", "epoch: 87, batch: 1100 // loss: 0.136\n", "epoch: 87, batch: 1200 // loss: 0.126\n", "\n", "epoch: 88, batch: 0 // loss: 0.182\n", "epoch: 88, batch: 100 // loss: 0.179\n", "epoch: 88, batch: 200 // loss: 0.231\n", "epoch: 88, batch: 300 // loss: 0.205\n", "epoch: 88, batch: 400 // loss: 0.140\n", "epoch: 88, batch: 500 // loss: 0.388\n", "epoch: 88, batch: 600 // loss: 0.317\n", "epoch: 88, batch: 700 // loss: 0.214\n", "epoch: 88, batch: 800 // loss: 0.166\n", "epoch: 88, batch: 900 // loss: 0.067\n", "epoch: 88, batch: 1000 // loss: 0.466\n", "epoch: 88, batch: 1100 // loss: 0.134\n", "epoch: 88, batch: 1200 // loss: 0.124\n", "\n", "epoch: 89, batch: 0 // loss: 0.186\n", "epoch: 89, batch: 100 // loss: 0.175\n", "epoch: 89, batch: 200 // loss: 0.224\n", "epoch: 89, batch: 300 // loss: 0.209\n", "epoch: 89, batch: 400 // loss: 0.138\n", "epoch: 89, batch: 500 // loss: 0.385\n", "epoch: 89, batch: 600 // loss: 0.315\n", "epoch: 89, batch: 700 // loss: 0.215\n", "epoch: 89, batch: 800 // loss: 0.162\n", "epoch: 89, batch: 900 // loss: 0.065\n", "epoch: 89, batch: 1000 // loss: 0.461\n", "epoch: 89, batch: 1100 // loss: 0.133\n", "epoch: 89, batch: 1200 // loss: 0.124\n", "\n", "epoch: 90, batch: 0 // loss: 0.179\n", "epoch: 90, batch: 100 // loss: 0.175\n", "epoch: 90, batch: 200 // loss: 0.225\n", "epoch: 90, batch: 300 // loss: 0.207\n", "epoch: 90, batch: 400 // loss: 0.140\n", "epoch: 90, batch: 500 // loss: 0.379\n", "epoch: 90, batch: 600 // loss: 0.308\n", "epoch: 90, batch: 700 // loss: 0.208\n", "epoch: 90, batch: 800 // loss: 0.156\n", "epoch: 90, batch: 900 // loss: 0.065\n", "epoch: 90, batch: 1000 // loss: 0.473\n", "epoch: 90, batch: 1100 // loss: 0.131\n", "epoch: 90, batch: 1200 // loss: 0.125\n", "\n", "epoch: 91, batch: 0 // loss: 0.174\n", "epoch: 91, batch: 100 // loss: 0.173\n", "epoch: 91, batch: 200 // loss: 0.222\n", "epoch: 91, batch: 300 // loss: 0.200\n", "epoch: 91, batch: 400 // loss: 0.139\n", "epoch: 91, batch: 500 // loss: 0.379\n", "epoch: 91, batch: 600 // loss: 0.303\n", "epoch: 91, batch: 700 // loss: 0.199\n", "epoch: 91, batch: 800 // loss: 0.153\n", "epoch: 91, batch: 900 // loss: 0.067\n", "epoch: 91, batch: 1000 // loss: 0.455\n", "epoch: 91, batch: 1100 // loss: 0.124\n", "epoch: 91, batch: 1200 // loss: 0.123\n", "\n", "epoch: 92, batch: 0 // loss: 0.176\n", "epoch: 92, batch: 100 // loss: 0.175\n", "epoch: 92, batch: 200 // loss: 0.230\n", "epoch: 92, batch: 300 // loss: 0.205\n", "epoch: 92, batch: 400 // loss: 0.139\n", "epoch: 92, batch: 500 // loss: 0.376\n", "epoch: 92, batch: 600 // loss: 0.295\n", "epoch: 92, batch: 700 // loss: 0.199\n", "epoch: 92, batch: 800 // loss: 0.155\n", "epoch: 92, batch: 900 // loss: 0.068\n", "epoch: 92, batch: 1000 // loss: 0.455\n", "epoch: 92, batch: 1100 // loss: 0.129\n", "epoch: 92, batch: 1200 // loss: 0.123\n", "\n", "epoch: 93, batch: 0 // loss: 0.177\n", "epoch: 93, batch: 100 // loss: 0.176\n", "epoch: 93, batch: 200 // loss: 0.216\n", "epoch: 93, batch: 300 // loss: 0.205\n", "epoch: 93, batch: 400 // loss: 0.137\n", "epoch: 93, batch: 500 // loss: 0.380\n", "epoch: 93, batch: 600 // loss: 0.298\n", "epoch: 93, batch: 700 // loss: 0.211\n", "epoch: 93, batch: 800 // loss: 0.155\n", "epoch: 93, batch: 900 // loss: 0.067\n", "epoch: 93, batch: 1000 // loss: 0.464\n", "epoch: 93, batch: 1100 // loss: 0.127\n", "epoch: 93, batch: 1200 // loss: 0.124\n", "\n", "epoch: 94, batch: 0 // loss: 0.171\n", "epoch: 94, batch: 100 // loss: 0.175\n", "epoch: 94, batch: 200 // loss: 0.228\n", "epoch: 94, batch: 300 // loss: 0.206\n", "epoch: 94, batch: 400 // loss: 0.139\n", "epoch: 94, batch: 500 // loss: 0.372\n", "epoch: 94, batch: 600 // loss: 0.292\n", "epoch: 94, batch: 700 // loss: 0.207\n", "epoch: 94, batch: 800 // loss: 0.156\n", "epoch: 94, batch: 900 // loss: 0.067\n", "epoch: 94, batch: 1000 // loss: 0.446\n", "epoch: 94, batch: 1100 // loss: 0.125\n", "epoch: 94, batch: 1200 // loss: 0.120\n", "\n", "epoch: 95, batch: 0 // loss: 0.178\n", "epoch: 95, batch: 100 // loss: 0.172\n", "epoch: 95, batch: 200 // loss: 0.229\n", "epoch: 95, batch: 300 // loss: 0.205\n", "epoch: 95, batch: 400 // loss: 0.138\n", "epoch: 95, batch: 500 // loss: 0.365\n", "epoch: 95, batch: 600 // loss: 0.292\n", "epoch: 95, batch: 700 // loss: 0.204\n", "epoch: 95, batch: 800 // loss: 0.155\n", "epoch: 95, batch: 900 // loss: 0.068\n", "epoch: 95, batch: 1000 // loss: 0.463\n", "epoch: 95, batch: 1100 // loss: 0.128\n", "epoch: 95, batch: 1200 // loss: 0.123\n", "\n", "epoch: 96, batch: 0 // loss: 0.172\n", "epoch: 96, batch: 100 // loss: 0.178\n", "epoch: 96, batch: 200 // loss: 0.225\n", "epoch: 96, batch: 300 // loss: 0.207\n", "epoch: 96, batch: 400 // loss: 0.140\n", "epoch: 96, batch: 500 // loss: 0.372\n", "epoch: 96, batch: 600 // loss: 0.289\n", "epoch: 96, batch: 700 // loss: 0.199\n", "epoch: 96, batch: 800 // loss: 0.154\n", "epoch: 96, batch: 900 // loss: 0.067\n", "epoch: 96, batch: 1000 // loss: 0.439\n", "epoch: 96, batch: 1100 // loss: 0.124\n", "epoch: 96, batch: 1200 // loss: 0.125\n", "\n", "epoch: 97, batch: 0 // loss: 0.177\n", "epoch: 97, batch: 100 // loss: 0.172\n", "epoch: 97, batch: 200 // loss: 0.231\n", "epoch: 97, batch: 300 // loss: 0.212\n", "epoch: 97, batch: 400 // loss: 0.139\n", "epoch: 97, batch: 500 // loss: 0.364\n", "epoch: 97, batch: 600 // loss: 0.285\n", "epoch: 97, batch: 700 // loss: 0.204\n", "epoch: 97, batch: 800 // loss: 0.155\n", "epoch: 97, batch: 900 // loss: 0.066\n", "epoch: 97, batch: 1000 // loss: 0.446\n", "epoch: 97, batch: 1100 // loss: 0.126\n", "epoch: 97, batch: 1200 // loss: 0.124\n", "\n", "epoch: 98, batch: 0 // loss: 0.185\n", "epoch: 98, batch: 100 // loss: 0.177\n", "epoch: 98, batch: 200 // loss: 0.226\n", "epoch: 98, batch: 300 // loss: 0.211\n", "epoch: 98, batch: 400 // loss: 0.140\n", "epoch: 98, batch: 500 // loss: 0.361\n", "epoch: 98, batch: 600 // loss: 0.286\n", "epoch: 98, batch: 700 // loss: 0.198\n", "epoch: 98, batch: 800 // loss: 0.153\n", "epoch: 98, batch: 900 // loss: 0.066\n", "epoch: 98, batch: 1000 // loss: 0.460\n", "epoch: 98, batch: 1100 // loss: 0.120\n", "epoch: 98, batch: 1200 // loss: 0.126\n", "\n", "epoch: 99, batch: 0 // loss: 0.178\n", "epoch: 99, batch: 100 // loss: 0.176\n", "epoch: 99, batch: 200 // loss: 0.223\n", "epoch: 99, batch: 300 // loss: 0.201\n", "epoch: 99, batch: 400 // loss: 0.140\n", "epoch: 99, batch: 500 // loss: 0.357\n", "epoch: 99, batch: 600 // loss: 0.282\n", "epoch: 99, batch: 700 // loss: 0.197\n", "epoch: 99, batch: 800 // loss: 0.150\n", "epoch: 99, batch: 900 // loss: 0.067\n", "epoch: 99, batch: 1000 // loss: 0.450\n", "epoch: 99, batch: 1100 // loss: 0.120\n", "epoch: 99, batch: 1200 // loss: 0.123\n" ] } ], "source": [ "EPOCHS = 100\n", "for epoch in range(EPOCHS): \n", "\n", " running_loss = 0.0\n", " idx, batch_num = 0, 0\n", " batch_size = 16\n", " \n", " print(\"\")\n", " while idx < 20000:\n", " # zero the parameter gradients\n", " optimizer.zero_grad()\n", " \n", " X_batch = X[idx: idx + batch_size].float()\n", " y_batch = y[idx: idx + batch_size]\n", " idx += batch_size\n", " \n", " # now run our X's forward, get preds, incur\n", " # loss, backprop, and step the optimizer.\n", " y_hat_batch = model(X_batch)\n", " loss = loss_function(y_hat_batch, y_batch)\n", " loss.backward()\n", " optimizer.step()\n", "\n", " # print statistics\n", " running_loss += loss.item()\n", " if batch_num % 100 == 0:\n", " print(\"epoch: {}, batch: {} // loss: {:.3f}\".format(epoch, batch_num, loss.item()))\n", " \n", " batch_num += 1" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "## OK! Now let's come back to auto-encoders" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### TODO 1\n", "\n", "Implement a simple autoencoder in `torch`. In particular, let's start with a vanilla linear auto-encoder, mapping to two dimensions in the hidden space." ] }, { "cell_type": "code", "execution_count": 192, "metadata": {}, "outputs": [], "source": [ "class AE(nn.Module):\n", " \n", " def __init__(self, input_size=784, hidden_size=2):\n", " '''\n", " In the initializer we setup model parameters/layers.\n", " '''\n", " super(AE, self).__init__() \n", "\n", " ### REMOVE BELOW\n", " self.input_size = input_size\n", " self.hidden_size = hidden_size\n", " \n", " # input layer; from x -> z\n", " self.i = nn.Linear(self.input_size, self.hidden_size)\n", " \n", " # output layer\n", " self.o = nn.Linear(self.hidden_size, self.input_size)\n", " \n", "\n", " def forward(self, X, return_z=False):\n", " ### REMOVE BELOW\n", " z = self.i(X)\n", " if return_z:\n", " return z\n", " return self.o(z)" ] }, { "cell_type": "code", "execution_count": 193, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "torch.Size([5, 784])" ] }, "execution_count": 193, "metadata": {}, "output_type": "execute_result" } ], "source": [ "auto = AE(hidden_size=50)\n", "X_tilde = auto(X[:5,:].float())\n", "X_tilde.shape" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### TODO 2 \n", "\n", "Define a training loop -- follow the above example. \n", "\n", "**hint** check out: https://pytorch.org/docs/stable/nn.html#loss-functions" ] }, { "cell_type": "code", "execution_count": 194, "metadata": {}, "outputs": [], "source": [ "def train_AE(X_in, X_target, model, optimizer, loss_function, EPOCHS=10):\n", " for epoch in range(EPOCHS): \n", " idx, batch_num = 0, 0\n", " batch_size = 16\n", "\n", " print(\"\")\n", " while idx < 60000:\n", " # zero the parameter gradients\n", " optimizer.zero_grad()\n", "\n", " X_batch = X_in[idx: idx + batch_size].float()\n", " X_target_batch = X_target[idx: idx + batch_size].float()\n", " idx += batch_size\n", "\n", " # now run our X's forward, get preds, incur\n", " # loss, backprop, and step the optimizer.\n", " X_tilde_batch = model(X_batch)\n", " loss = loss_function(X_tilde_batch, X_target_batch)\n", " loss.backward()\n", " optimizer.step()\n", "\n", " # print out loss\n", " if batch_num % 100 == 0:\n", " print(\"epoch: {}, batch: {} // loss: {:.3f}\".format(epoch, batch_num, loss.item()))\n", "\n", " batch_num += 1" ] }, { "cell_type": "code", "execution_count": 195, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "epoch: 0, batch: 0 // loss: 0.383\n", "epoch: 0, batch: 100 // loss: 0.357\n", "epoch: 0, batch: 200 // loss: 0.321\n", "epoch: 0, batch: 300 // loss: 0.303\n", "epoch: 0, batch: 400 // loss: 0.298\n", "epoch: 0, batch: 500 // loss: 0.288\n", "epoch: 0, batch: 600 // loss: 0.284\n", "epoch: 0, batch: 700 // loss: 0.283\n", "epoch: 0, batch: 800 // loss: 0.248\n", "epoch: 0, batch: 900 // loss: 0.278\n", "epoch: 0, batch: 1000 // loss: 0.245\n", "epoch: 0, batch: 1100 // loss: 0.265\n", "epoch: 0, batch: 1200 // loss: 0.218\n", "epoch: 0, batch: 1300 // loss: 0.243\n", "epoch: 0, batch: 1400 // loss: 0.203\n", "epoch: 0, batch: 1500 // loss: 0.199\n", "epoch: 0, batch: 1600 // loss: 0.214\n", "epoch: 0, batch: 1700 // loss: 0.196\n", "epoch: 0, batch: 1800 // loss: 0.219\n", "epoch: 0, batch: 1900 // loss: 0.192\n", "epoch: 0, batch: 2000 // loss: 0.168\n", "epoch: 0, batch: 2100 // loss: 0.169\n", "epoch: 0, batch: 2200 // loss: 0.195\n", "epoch: 0, batch: 2300 // loss: 0.171\n", "epoch: 0, batch: 2400 // loss: 0.138\n", "epoch: 0, batch: 2500 // loss: 0.140\n", "epoch: 0, batch: 2600 // loss: 0.172\n", "epoch: 0, batch: 2700 // loss: 0.134\n", "epoch: 0, batch: 2800 // loss: 0.167\n", "epoch: 0, batch: 2900 // loss: 0.124\n", "epoch: 0, batch: 3000 // loss: 0.134\n", "epoch: 0, batch: 3100 // loss: 0.151\n", "epoch: 0, batch: 3200 // loss: 0.116\n", "epoch: 0, batch: 3300 // loss: 0.126\n", "epoch: 0, batch: 3400 // loss: 0.123\n", "epoch: 0, batch: 3500 // loss: 0.127\n", "epoch: 0, batch: 3600 // loss: 0.131\n", "epoch: 0, batch: 3700 // loss: 0.140\n", "\n", "epoch: 1, batch: 0 // loss: 0.134\n", "epoch: 1, batch: 100 // loss: 0.127\n", "epoch: 1, batch: 200 // loss: 0.124\n", "epoch: 1, batch: 300 // loss: 0.114\n", "epoch: 1, batch: 400 // loss: 0.116\n", "epoch: 1, batch: 500 // loss: 0.109\n", "epoch: 1, batch: 600 // loss: 0.111\n", "epoch: 1, batch: 700 // loss: 0.115\n", "epoch: 1, batch: 800 // loss: 0.105\n", "epoch: 1, batch: 900 // loss: 0.125\n", "epoch: 1, batch: 1000 // loss: 0.103\n", "epoch: 1, batch: 1100 // loss: 0.120\n", "epoch: 1, batch: 1200 // loss: 0.099\n", "epoch: 1, batch: 1300 // loss: 0.116\n", "epoch: 1, batch: 1400 // loss: 0.097\n", "epoch: 1, batch: 1500 // loss: 0.097\n", "epoch: 1, batch: 1600 // loss: 0.109\n", "epoch: 1, batch: 1700 // loss: 0.105\n", "epoch: 1, batch: 1800 // loss: 0.114\n", "epoch: 1, batch: 1900 // loss: 0.102\n", "epoch: 1, batch: 2000 // loss: 0.090\n", "epoch: 1, batch: 2100 // loss: 0.097\n", "epoch: 1, batch: 2200 // loss: 0.114\n", "epoch: 1, batch: 2300 // loss: 0.101\n", "epoch: 1, batch: 2400 // loss: 0.084\n", "epoch: 1, batch: 2500 // loss: 0.083\n", "epoch: 1, batch: 2600 // loss: 0.106\n", "epoch: 1, batch: 2700 // loss: 0.083\n", "epoch: 1, batch: 2800 // loss: 0.108\n", "epoch: 1, batch: 2900 // loss: 0.080\n", "epoch: 1, batch: 3000 // loss: 0.088\n", "epoch: 1, batch: 3100 // loss: 0.098\n", "epoch: 1, batch: 3200 // loss: 0.081\n", "epoch: 1, batch: 3300 // loss: 0.086\n", "epoch: 1, batch: 3400 // loss: 0.082\n", "epoch: 1, batch: 3500 // loss: 0.089\n", "epoch: 1, batch: 3600 // loss: 0.095\n", "epoch: 1, batch: 3700 // loss: 0.101\n", "\n", "epoch: 2, batch: 0 // loss: 0.103\n", "epoch: 2, batch: 100 // loss: 0.091\n", "epoch: 2, batch: 200 // loss: 0.098\n", "epoch: 2, batch: 300 // loss: 0.089\n", "epoch: 2, batch: 400 // loss: 0.090\n", "epoch: 2, batch: 500 // loss: 0.083\n", "epoch: 2, batch: 600 // loss: 0.085\n", "epoch: 2, batch: 700 // loss: 0.089\n", "epoch: 2, batch: 800 // loss: 0.087\n", "epoch: 2, batch: 900 // loss: 0.101\n", "epoch: 2, batch: 1000 // loss: 0.082\n", "epoch: 2, batch: 1100 // loss: 0.095\n", "epoch: 2, batch: 1200 // loss: 0.084\n", "epoch: 2, batch: 1300 // loss: 0.096\n", "epoch: 2, batch: 1400 // loss: 0.083\n", "epoch: 2, batch: 1500 // loss: 0.083\n", "epoch: 2, batch: 1600 // loss: 0.093\n", "epoch: 2, batch: 1700 // loss: 0.093\n", "epoch: 2, batch: 1800 // loss: 0.095\n", "epoch: 2, batch: 1900 // loss: 0.088\n", "epoch: 2, batch: 2000 // loss: 0.079\n", "epoch: 2, batch: 2100 // loss: 0.088\n", "epoch: 2, batch: 2200 // loss: 0.100\n", "epoch: 2, batch: 2300 // loss: 0.091\n", "epoch: 2, batch: 2400 // loss: 0.080\n", "epoch: 2, batch: 2500 // loss: 0.076\n", "epoch: 2, batch: 2600 // loss: 0.095\n", "epoch: 2, batch: 2700 // loss: 0.077\n", "epoch: 2, batch: 2800 // loss: 0.098\n", "epoch: 2, batch: 2900 // loss: 0.076\n", "epoch: 2, batch: 3000 // loss: 0.083\n", "epoch: 2, batch: 3100 // loss: 0.090\n", "epoch: 2, batch: 3200 // loss: 0.079\n", "epoch: 2, batch: 3300 // loss: 0.080\n", "epoch: 2, batch: 3400 // loss: 0.076\n", "epoch: 2, batch: 3500 // loss: 0.083\n", "epoch: 2, batch: 3600 // loss: 0.091\n", "epoch: 2, batch: 3700 // loss: 0.094\n", "\n", "epoch: 3, batch: 0 // loss: 0.099\n", "epoch: 3, batch: 100 // loss: 0.085\n", "epoch: 3, batch: 200 // loss: 0.095\n", "epoch: 3, batch: 300 // loss: 0.086\n", "epoch: 3, batch: 400 // loss: 0.087\n", "epoch: 3, batch: 500 // loss: 0.079\n", "epoch: 3, batch: 600 // loss: 0.081\n", "epoch: 3, batch: 700 // loss: 0.085\n", "epoch: 3, batch: 800 // loss: 0.085\n", "epoch: 3, batch: 900 // loss: 0.096\n", "epoch: 3, batch: 1000 // loss: 0.078\n", "epoch: 3, batch: 1100 // loss: 0.090\n", "epoch: 3, batch: 1200 // loss: 0.082\n", "epoch: 3, batch: 1300 // loss: 0.092\n", "epoch: 3, batch: 1400 // loss: 0.082\n", "epoch: 3, batch: 1500 // loss: 0.082\n", "epoch: 3, batch: 1600 // loss: 0.090\n", "epoch: 3, batch: 1700 // loss: 0.091\n", "epoch: 3, batch: 1800 // loss: 0.092\n", "epoch: 3, batch: 1900 // loss: 0.086\n", "epoch: 3, batch: 2000 // loss: 0.078\n", "epoch: 3, batch: 2100 // loss: 0.088\n", "epoch: 3, batch: 2200 // loss: 0.098\n", "epoch: 3, batch: 2300 // loss: 0.090\n", "epoch: 3, batch: 2400 // loss: 0.081\n", "epoch: 3, batch: 2500 // loss: 0.076\n", "epoch: 3, batch: 2600 // loss: 0.093\n", "epoch: 3, batch: 2700 // loss: 0.077\n", "epoch: 3, batch: 2800 // loss: 0.096\n", "epoch: 3, batch: 2900 // loss: 0.076\n", "epoch: 3, batch: 3000 // loss: 0.082\n", "epoch: 3, batch: 3100 // loss: 0.088\n", "epoch: 3, batch: 3200 // loss: 0.079\n", "epoch: 3, batch: 3300 // loss: 0.079\n", "epoch: 3, batch: 3400 // loss: 0.076\n", "epoch: 3, batch: 3500 // loss: 0.082\n", "epoch: 3, batch: 3600 // loss: 0.090\n", "epoch: 3, batch: 3700 // loss: 0.092\n", "\n", "epoch: 4, batch: 0 // loss: 0.098\n", "epoch: 4, batch: 100 // loss: 0.084\n", "epoch: 4, batch: 200 // loss: 0.095\n", "epoch: 4, batch: 300 // loss: 0.086\n", "epoch: 4, batch: 400 // loss: 0.087\n", "epoch: 4, batch: 500 // loss: 0.078\n", "epoch: 4, batch: 600 // loss: 0.081\n", "epoch: 4, batch: 700 // loss: 0.084\n", "epoch: 4, batch: 800 // loss: 0.085\n", "epoch: 4, batch: 900 // loss: 0.096\n", "epoch: 4, batch: 1000 // loss: 0.077\n", "epoch: 4, batch: 1100 // loss: 0.089\n", "epoch: 4, batch: 1200 // loss: 0.082\n", "epoch: 4, batch: 1300 // loss: 0.091\n", "epoch: 4, batch: 1400 // loss: 0.082\n", "epoch: 4, batch: 1500 // loss: 0.082\n", "epoch: 4, batch: 1600 // loss: 0.090\n", "epoch: 4, batch: 1700 // loss: 0.091\n", "epoch: 4, batch: 1800 // loss: 0.090\n", "epoch: 4, batch: 1900 // loss: 0.085\n", "epoch: 4, batch: 2000 // loss: 0.078\n", "epoch: 4, batch: 2100 // loss: 0.088\n", "epoch: 4, batch: 2200 // loss: 0.097\n", "epoch: 4, batch: 2300 // loss: 0.089\n", "epoch: 4, batch: 2400 // loss: 0.081\n", "epoch: 4, batch: 2500 // loss: 0.076\n", "epoch: 4, batch: 2600 // loss: 0.092\n", "epoch: 4, batch: 2700 // loss: 0.077\n", "epoch: 4, batch: 2800 // loss: 0.096\n", "epoch: 4, batch: 2900 // loss: 0.076\n", "epoch: 4, batch: 3000 // loss: 0.082\n", "epoch: 4, batch: 3100 // loss: 0.087\n", "epoch: 4, batch: 3200 // loss: 0.080\n", "epoch: 4, batch: 3300 // loss: 0.079\n", "epoch: 4, batch: 3400 // loss: 0.075\n", "epoch: 4, batch: 3500 // loss: 0.082\n", "epoch: 4, batch: 3600 // loss: 0.090\n", "epoch: 4, batch: 3700 // loss: 0.092\n", "\n", "epoch: 5, batch: 0 // loss: 0.098\n", "epoch: 5, batch: 100 // loss: 0.083\n", "epoch: 5, batch: 200 // loss: 0.095\n", "epoch: 5, batch: 300 // loss: 0.086\n", "epoch: 5, batch: 400 // loss: 0.087\n", "epoch: 5, batch: 500 // loss: 0.078\n", "epoch: 5, batch: 600 // loss: 0.080\n", "epoch: 5, batch: 700 // loss: 0.084\n", "epoch: 5, batch: 800 // loss: 0.085\n", "epoch: 5, batch: 900 // loss: 0.095\n", "epoch: 5, batch: 1000 // loss: 0.077\n", "epoch: 5, batch: 1100 // loss: 0.088\n", "epoch: 5, batch: 1200 // loss: 0.082\n", "epoch: 5, batch: 1300 // loss: 0.091\n", "epoch: 5, batch: 1400 // loss: 0.082\n", "epoch: 5, batch: 1500 // loss: 0.082\n", "epoch: 5, batch: 1600 // loss: 0.090\n", "epoch: 5, batch: 1700 // loss: 0.091\n", "epoch: 5, batch: 1800 // loss: 0.090\n", "epoch: 5, batch: 1900 // loss: 0.085\n", "epoch: 5, batch: 2000 // loss: 0.078\n", "epoch: 5, batch: 2100 // loss: 0.088\n", "epoch: 5, batch: 2200 // loss: 0.097\n", "epoch: 5, batch: 2300 // loss: 0.089\n", "epoch: 5, batch: 2400 // loss: 0.081\n", "epoch: 5, batch: 2500 // loss: 0.076\n", "epoch: 5, batch: 2600 // loss: 0.092\n", "epoch: 5, batch: 2700 // loss: 0.077\n", "epoch: 5, batch: 2800 // loss: 0.096\n", "epoch: 5, batch: 2900 // loss: 0.076\n", "epoch: 5, batch: 3000 // loss: 0.082\n", "epoch: 5, batch: 3100 // loss: 0.087\n", "epoch: 5, batch: 3200 // loss: 0.080\n", "epoch: 5, batch: 3300 // loss: 0.079\n", "epoch: 5, batch: 3400 // loss: 0.075\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 5, batch: 3500 // loss: 0.082\n", "epoch: 5, batch: 3600 // loss: 0.090\n", "epoch: 5, batch: 3700 // loss: 0.092\n", "\n", "epoch: 6, batch: 0 // loss: 0.098\n", "epoch: 6, batch: 100 // loss: 0.083\n", "epoch: 6, batch: 200 // loss: 0.095\n", "epoch: 6, batch: 300 // loss: 0.086\n", "epoch: 6, batch: 400 // loss: 0.087\n", "epoch: 6, batch: 500 // loss: 0.078\n", "epoch: 6, batch: 600 // loss: 0.080\n", "epoch: 6, batch: 700 // loss: 0.083\n", "epoch: 6, batch: 800 // loss: 0.085\n", "epoch: 6, batch: 900 // loss: 0.095\n", "epoch: 6, batch: 1000 // loss: 0.077\n", "epoch: 6, batch: 1100 // loss: 0.088\n", "epoch: 6, batch: 1200 // loss: 0.082\n", "epoch: 6, batch: 1300 // loss: 0.091\n", "epoch: 6, batch: 1400 // loss: 0.082\n", "epoch: 6, batch: 1500 // loss: 0.082\n", "epoch: 6, batch: 1600 // loss: 0.089\n", "epoch: 6, batch: 1700 // loss: 0.091\n", "epoch: 6, batch: 1800 // loss: 0.090\n", "epoch: 6, batch: 1900 // loss: 0.085\n", "epoch: 6, batch: 2000 // loss: 0.078\n", "epoch: 6, batch: 2100 // loss: 0.088\n", "epoch: 6, batch: 2200 // loss: 0.096\n", "epoch: 6, batch: 2300 // loss: 0.089\n", "epoch: 6, batch: 2400 // loss: 0.081\n", "epoch: 6, batch: 2500 // loss: 0.076\n", "epoch: 6, batch: 2600 // loss: 0.092\n", "epoch: 6, batch: 2700 // loss: 0.077\n", "epoch: 6, batch: 2800 // loss: 0.095\n", "epoch: 6, batch: 2900 // loss: 0.076\n", "epoch: 6, batch: 3000 // loss: 0.082\n", "epoch: 6, batch: 3100 // loss: 0.087\n", "epoch: 6, batch: 3200 // loss: 0.080\n", "epoch: 6, batch: 3300 // loss: 0.079\n", "epoch: 6, batch: 3400 // loss: 0.075\n", "epoch: 6, batch: 3500 // loss: 0.081\n", "epoch: 6, batch: 3600 // loss: 0.090\n", "epoch: 6, batch: 3700 // loss: 0.092\n", "\n", "epoch: 7, batch: 0 // loss: 0.098\n", "epoch: 7, batch: 100 // loss: 0.083\n", "epoch: 7, batch: 200 // loss: 0.095\n", "epoch: 7, batch: 300 // loss: 0.086\n", "epoch: 7, batch: 400 // loss: 0.087\n", "epoch: 7, batch: 500 // loss: 0.078\n", "epoch: 7, batch: 600 // loss: 0.080\n", "epoch: 7, batch: 700 // loss: 0.083\n", "epoch: 7, batch: 800 // loss: 0.085\n", "epoch: 7, batch: 900 // loss: 0.095\n", "epoch: 7, batch: 1000 // loss: 0.077\n", "epoch: 7, batch: 1100 // loss: 0.088\n", "epoch: 7, batch: 1200 // loss: 0.082\n", "epoch: 7, batch: 1300 // loss: 0.090\n", "epoch: 7, batch: 1400 // loss: 0.082\n", "epoch: 7, batch: 1500 // loss: 0.082\n", "epoch: 7, batch: 1600 // loss: 0.089\n", "epoch: 7, batch: 1700 // loss: 0.090\n", "epoch: 7, batch: 1800 // loss: 0.090\n", "epoch: 7, batch: 1900 // loss: 0.085\n", "epoch: 7, batch: 2000 // loss: 0.078\n", "epoch: 7, batch: 2100 // loss: 0.088\n", "epoch: 7, batch: 2200 // loss: 0.096\n", "epoch: 7, batch: 2300 // loss: 0.089\n", "epoch: 7, batch: 2400 // loss: 0.081\n", "epoch: 7, batch: 2500 // loss: 0.076\n", "epoch: 7, batch: 2600 // loss: 0.091\n", "epoch: 7, batch: 2700 // loss: 0.077\n", "epoch: 7, batch: 2800 // loss: 0.095\n", "epoch: 7, batch: 2900 // loss: 0.076\n", "epoch: 7, batch: 3000 // loss: 0.082\n", "epoch: 7, batch: 3100 // loss: 0.087\n", "epoch: 7, batch: 3200 // loss: 0.080\n", "epoch: 7, batch: 3300 // loss: 0.079\n", "epoch: 7, batch: 3400 // loss: 0.075\n", "epoch: 7, batch: 3500 // loss: 0.081\n", "epoch: 7, batch: 3600 // loss: 0.089\n", "epoch: 7, batch: 3700 // loss: 0.091\n", "\n", "epoch: 8, batch: 0 // loss: 0.098\n", "epoch: 8, batch: 100 // loss: 0.082\n", "epoch: 8, batch: 200 // loss: 0.095\n", "epoch: 8, batch: 300 // loss: 0.086\n", "epoch: 8, batch: 400 // loss: 0.087\n", "epoch: 8, batch: 500 // loss: 0.078\n", "epoch: 8, batch: 600 // loss: 0.080\n", "epoch: 8, batch: 700 // loss: 0.083\n", "epoch: 8, batch: 800 // loss: 0.085\n", "epoch: 8, batch: 900 // loss: 0.094\n", "epoch: 8, batch: 1000 // loss: 0.077\n", "epoch: 8, batch: 1100 // loss: 0.088\n", "epoch: 8, batch: 1200 // loss: 0.082\n", "epoch: 8, batch: 1300 // loss: 0.090\n", "epoch: 8, batch: 1400 // loss: 0.082\n", "epoch: 8, batch: 1500 // loss: 0.081\n", "epoch: 8, batch: 1600 // loss: 0.089\n", "epoch: 8, batch: 1700 // loss: 0.090\n", "epoch: 8, batch: 1800 // loss: 0.089\n", "epoch: 8, batch: 1900 // loss: 0.085\n", "epoch: 8, batch: 2000 // loss: 0.078\n", "epoch: 8, batch: 2100 // loss: 0.087\n", "epoch: 8, batch: 2200 // loss: 0.096\n", "epoch: 8, batch: 2300 // loss: 0.089\n", "epoch: 8, batch: 2400 // loss: 0.081\n", "epoch: 8, batch: 2500 // loss: 0.076\n", "epoch: 8, batch: 2600 // loss: 0.091\n", "epoch: 8, batch: 2700 // loss: 0.076\n", "epoch: 8, batch: 2800 // loss: 0.095\n", "epoch: 8, batch: 2900 // loss: 0.076\n", "epoch: 8, batch: 3000 // loss: 0.081\n", "epoch: 8, batch: 3100 // loss: 0.086\n", "epoch: 8, batch: 3200 // loss: 0.079\n", "epoch: 8, batch: 3300 // loss: 0.079\n", "epoch: 8, batch: 3400 // loss: 0.075\n", "epoch: 8, batch: 3500 // loss: 0.081\n", "epoch: 8, batch: 3600 // loss: 0.089\n", "epoch: 8, batch: 3700 // loss: 0.091\n", "\n", "epoch: 9, batch: 0 // loss: 0.097\n", "epoch: 9, batch: 100 // loss: 0.082\n", "epoch: 9, batch: 200 // loss: 0.094\n", "epoch: 9, batch: 300 // loss: 0.085\n", "epoch: 9, batch: 400 // loss: 0.086\n", "epoch: 9, batch: 500 // loss: 0.077\n", "epoch: 9, batch: 600 // loss: 0.079\n", "epoch: 9, batch: 700 // loss: 0.083\n", "epoch: 9, batch: 800 // loss: 0.084\n", "epoch: 9, batch: 900 // loss: 0.094\n", "epoch: 9, batch: 1000 // loss: 0.076\n", "epoch: 9, batch: 1100 // loss: 0.087\n", "epoch: 9, batch: 1200 // loss: 0.082\n", "epoch: 9, batch: 1300 // loss: 0.090\n", "epoch: 9, batch: 1400 // loss: 0.082\n", "epoch: 9, batch: 1500 // loss: 0.081\n", "epoch: 9, batch: 1600 // loss: 0.089\n", "epoch: 9, batch: 1700 // loss: 0.090\n", "epoch: 9, batch: 1800 // loss: 0.089\n", "epoch: 9, batch: 1900 // loss: 0.084\n", "epoch: 9, batch: 2000 // loss: 0.078\n", "epoch: 9, batch: 2100 // loss: 0.087\n", "epoch: 9, batch: 2200 // loss: 0.095\n", "epoch: 9, batch: 2300 // loss: 0.088\n", "epoch: 9, batch: 2400 // loss: 0.081\n", "epoch: 9, batch: 2500 // loss: 0.075\n", "epoch: 9, batch: 2600 // loss: 0.091\n", "epoch: 9, batch: 2700 // loss: 0.076\n", "epoch: 9, batch: 2800 // loss: 0.094\n", "epoch: 9, batch: 2900 // loss: 0.075\n", "epoch: 9, batch: 3000 // loss: 0.081\n", "epoch: 9, batch: 3100 // loss: 0.086\n", "epoch: 9, batch: 3200 // loss: 0.079\n", "epoch: 9, batch: 3300 // loss: 0.078\n", "epoch: 9, batch: 3400 // loss: 0.075\n", "epoch: 9, batch: 3500 // loss: 0.080\n", "epoch: 9, batch: 3600 // loss: 0.089\n", "epoch: 9, batch: 3700 // loss: 0.091\n", "\n", "epoch: 10, batch: 0 // loss: 0.097\n", "epoch: 10, batch: 100 // loss: 0.082\n", "epoch: 10, batch: 200 // loss: 0.094\n", "epoch: 10, batch: 300 // loss: 0.085\n", "epoch: 10, batch: 400 // loss: 0.086\n", "epoch: 10, batch: 500 // loss: 0.077\n", "epoch: 10, batch: 600 // loss: 0.079\n", "epoch: 10, batch: 700 // loss: 0.082\n", "epoch: 10, batch: 800 // loss: 0.084\n", "epoch: 10, batch: 900 // loss: 0.094\n", "epoch: 10, batch: 1000 // loss: 0.076\n", "epoch: 10, batch: 1100 // loss: 0.087\n", "epoch: 10, batch: 1200 // loss: 0.081\n", "epoch: 10, batch: 1300 // loss: 0.089\n", "epoch: 10, batch: 1400 // loss: 0.081\n", "epoch: 10, batch: 1500 // loss: 0.081\n", "epoch: 10, batch: 1600 // loss: 0.088\n", "epoch: 10, batch: 1700 // loss: 0.089\n", "epoch: 10, batch: 1800 // loss: 0.089\n", "epoch: 10, batch: 1900 // loss: 0.084\n", "epoch: 10, batch: 2000 // loss: 0.077\n", "epoch: 10, batch: 2100 // loss: 0.087\n", "epoch: 10, batch: 2200 // loss: 0.095\n", "epoch: 10, batch: 2300 // loss: 0.088\n", "epoch: 10, batch: 2400 // loss: 0.081\n", "epoch: 10, batch: 2500 // loss: 0.075\n", "epoch: 10, batch: 2600 // loss: 0.090\n", "epoch: 10, batch: 2700 // loss: 0.076\n", "epoch: 10, batch: 2800 // loss: 0.094\n", "epoch: 10, batch: 2900 // loss: 0.075\n", "epoch: 10, batch: 3000 // loss: 0.081\n", "epoch: 10, batch: 3100 // loss: 0.085\n", "epoch: 10, batch: 3200 // loss: 0.079\n", "epoch: 10, batch: 3300 // loss: 0.078\n", "epoch: 10, batch: 3400 // loss: 0.074\n", "epoch: 10, batch: 3500 // loss: 0.080\n", "epoch: 10, batch: 3600 // loss: 0.088\n", "epoch: 10, batch: 3700 // loss: 0.090\n", "\n", "epoch: 11, batch: 0 // loss: 0.096\n", "epoch: 11, batch: 100 // loss: 0.081\n", "epoch: 11, batch: 200 // loss: 0.093\n", "epoch: 11, batch: 300 // loss: 0.085\n", "epoch: 11, batch: 400 // loss: 0.085\n", "epoch: 11, batch: 500 // loss: 0.076\n", "epoch: 11, batch: 600 // loss: 0.078\n", "epoch: 11, batch: 700 // loss: 0.082\n", "epoch: 11, batch: 800 // loss: 0.083\n", "epoch: 11, batch: 900 // loss: 0.093\n", "epoch: 11, batch: 1000 // loss: 0.076\n", "epoch: 11, batch: 1100 // loss: 0.086\n", "epoch: 11, batch: 1200 // loss: 0.081\n", "epoch: 11, batch: 1300 // loss: 0.088\n", "epoch: 11, batch: 1400 // loss: 0.081\n", "epoch: 11, batch: 1500 // loss: 0.081\n", "epoch: 11, batch: 1600 // loss: 0.088\n", "epoch: 11, batch: 1700 // loss: 0.088\n", "epoch: 11, batch: 1800 // loss: 0.088\n", "epoch: 11, batch: 1900 // loss: 0.084\n", "epoch: 11, batch: 2000 // loss: 0.077\n", "epoch: 11, batch: 2100 // loss: 0.086\n", "epoch: 11, batch: 2200 // loss: 0.094\n", "epoch: 11, batch: 2300 // loss: 0.087\n", "epoch: 11, batch: 2400 // loss: 0.080\n", "epoch: 11, batch: 2500 // loss: 0.075\n", "epoch: 11, batch: 2600 // loss: 0.089\n", "epoch: 11, batch: 2700 // loss: 0.075\n", "epoch: 11, batch: 2800 // loss: 0.093\n", "epoch: 11, batch: 2900 // loss: 0.075\n", "epoch: 11, batch: 3000 // loss: 0.080\n", "epoch: 11, batch: 3100 // loss: 0.085\n", "epoch: 11, batch: 3200 // loss: 0.078\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 11, batch: 3300 // loss: 0.077\n", "epoch: 11, batch: 3400 // loss: 0.074\n", "epoch: 11, batch: 3500 // loss: 0.079\n", "epoch: 11, batch: 3600 // loss: 0.087\n", "epoch: 11, batch: 3700 // loss: 0.089\n", "\n", "epoch: 12, batch: 0 // loss: 0.096\n", "epoch: 12, batch: 100 // loss: 0.081\n", "epoch: 12, batch: 200 // loss: 0.092\n", "epoch: 12, batch: 300 // loss: 0.084\n", "epoch: 12, batch: 400 // loss: 0.085\n", "epoch: 12, batch: 500 // loss: 0.076\n", "epoch: 12, batch: 600 // loss: 0.078\n", "epoch: 12, batch: 700 // loss: 0.081\n", "epoch: 12, batch: 800 // loss: 0.083\n", "epoch: 12, batch: 900 // loss: 0.092\n", "epoch: 12, batch: 1000 // loss: 0.075\n", "epoch: 12, batch: 1100 // loss: 0.085\n", "epoch: 12, batch: 1200 // loss: 0.081\n", "epoch: 12, batch: 1300 // loss: 0.088\n", "epoch: 12, batch: 1400 // loss: 0.080\n", "epoch: 12, batch: 1500 // loss: 0.080\n", "epoch: 12, batch: 1600 // loss: 0.087\n", "epoch: 12, batch: 1700 // loss: 0.087\n", "epoch: 12, batch: 1800 // loss: 0.088\n", "epoch: 12, batch: 1900 // loss: 0.083\n", "epoch: 12, batch: 2000 // loss: 0.077\n", "epoch: 12, batch: 2100 // loss: 0.086\n", "epoch: 12, batch: 2200 // loss: 0.093\n", "epoch: 12, batch: 2300 // loss: 0.086\n", "epoch: 12, batch: 2400 // loss: 0.080\n", "epoch: 12, batch: 2500 // loss: 0.074\n", "epoch: 12, batch: 2600 // loss: 0.088\n", "epoch: 12, batch: 2700 // loss: 0.075\n", "epoch: 12, batch: 2800 // loss: 0.092\n", "epoch: 12, batch: 2900 // loss: 0.074\n", "epoch: 12, batch: 3000 // loss: 0.079\n", "epoch: 12, batch: 3100 // loss: 0.084\n", "epoch: 12, batch: 3200 // loss: 0.078\n", "epoch: 12, batch: 3300 // loss: 0.077\n", "epoch: 12, batch: 3400 // loss: 0.073\n", "epoch: 12, batch: 3500 // loss: 0.078\n", "epoch: 12, batch: 3600 // loss: 0.086\n", "epoch: 12, batch: 3700 // loss: 0.089\n", "\n", "epoch: 13, batch: 0 // loss: 0.095\n", "epoch: 13, batch: 100 // loss: 0.080\n", "epoch: 13, batch: 200 // loss: 0.091\n", "epoch: 13, batch: 300 // loss: 0.084\n", "epoch: 13, batch: 400 // loss: 0.084\n", "epoch: 13, batch: 500 // loss: 0.075\n", "epoch: 13, batch: 600 // loss: 0.077\n", "epoch: 13, batch: 700 // loss: 0.080\n", "epoch: 13, batch: 800 // loss: 0.082\n", "epoch: 13, batch: 900 // loss: 0.091\n", "epoch: 13, batch: 1000 // loss: 0.075\n", "epoch: 13, batch: 1100 // loss: 0.084\n", "epoch: 13, batch: 1200 // loss: 0.080\n", "epoch: 13, batch: 1300 // loss: 0.087\n", "epoch: 13, batch: 1400 // loss: 0.079\n", "epoch: 13, batch: 1500 // loss: 0.080\n", "epoch: 13, batch: 1600 // loss: 0.087\n", "epoch: 13, batch: 1700 // loss: 0.086\n", "epoch: 13, batch: 1800 // loss: 0.087\n", "epoch: 13, batch: 1900 // loss: 0.082\n", "epoch: 13, batch: 2000 // loss: 0.076\n", "epoch: 13, batch: 2100 // loss: 0.085\n", "epoch: 13, batch: 2200 // loss: 0.092\n", "epoch: 13, batch: 2300 // loss: 0.085\n", "epoch: 13, batch: 2400 // loss: 0.079\n", "epoch: 13, batch: 2500 // loss: 0.073\n", "epoch: 13, batch: 2600 // loss: 0.087\n", "epoch: 13, batch: 2700 // loss: 0.074\n", "epoch: 13, batch: 2800 // loss: 0.091\n", "epoch: 13, batch: 2900 // loss: 0.073\n", "epoch: 13, batch: 3000 // loss: 0.078\n", "epoch: 13, batch: 3100 // loss: 0.083\n", "epoch: 13, batch: 3200 // loss: 0.077\n", "epoch: 13, batch: 3300 // loss: 0.076\n", "epoch: 13, batch: 3400 // loss: 0.073\n", "epoch: 13, batch: 3500 // loss: 0.077\n", "epoch: 13, batch: 3600 // loss: 0.085\n", "epoch: 13, batch: 3700 // loss: 0.088\n", "\n", "epoch: 14, batch: 0 // loss: 0.094\n", "epoch: 14, batch: 100 // loss: 0.079\n", "epoch: 14, batch: 200 // loss: 0.090\n", "epoch: 14, batch: 300 // loss: 0.083\n", "epoch: 14, batch: 400 // loss: 0.083\n", "epoch: 14, batch: 500 // loss: 0.074\n", "epoch: 14, batch: 600 // loss: 0.076\n", "epoch: 14, batch: 700 // loss: 0.079\n", "epoch: 14, batch: 800 // loss: 0.081\n", "epoch: 14, batch: 900 // loss: 0.090\n", "epoch: 14, batch: 1000 // loss: 0.074\n", "epoch: 14, batch: 1100 // loss: 0.083\n", "epoch: 14, batch: 1200 // loss: 0.079\n", "epoch: 14, batch: 1300 // loss: 0.085\n", "epoch: 14, batch: 1400 // loss: 0.079\n", "epoch: 14, batch: 1500 // loss: 0.079\n", "epoch: 14, batch: 1600 // loss: 0.086\n", "epoch: 14, batch: 1700 // loss: 0.085\n", "epoch: 14, batch: 1800 // loss: 0.086\n", "epoch: 14, batch: 1900 // loss: 0.081\n", "epoch: 14, batch: 2000 // loss: 0.076\n", "epoch: 14, batch: 2100 // loss: 0.084\n", "epoch: 14, batch: 2200 // loss: 0.091\n", "epoch: 14, batch: 2300 // loss: 0.084\n", "epoch: 14, batch: 2400 // loss: 0.078\n", "epoch: 14, batch: 2500 // loss: 0.073\n", "epoch: 14, batch: 2600 // loss: 0.086\n", "epoch: 14, batch: 2700 // loss: 0.073\n", "epoch: 14, batch: 2800 // loss: 0.090\n", "epoch: 14, batch: 2900 // loss: 0.073\n", "epoch: 14, batch: 3000 // loss: 0.077\n", "epoch: 14, batch: 3100 // loss: 0.082\n", "epoch: 14, batch: 3200 // loss: 0.076\n", "epoch: 14, batch: 3300 // loss: 0.075\n", "epoch: 14, batch: 3400 // loss: 0.072\n", "epoch: 14, batch: 3500 // loss: 0.075\n", "epoch: 14, batch: 3600 // loss: 0.084\n", "epoch: 14, batch: 3700 // loss: 0.086\n", "\n", "epoch: 15, batch: 0 // loss: 0.092\n", "epoch: 15, batch: 100 // loss: 0.078\n", "epoch: 15, batch: 200 // loss: 0.088\n", "epoch: 15, batch: 300 // loss: 0.082\n", "epoch: 15, batch: 400 // loss: 0.082\n", "epoch: 15, batch: 500 // loss: 0.073\n", "epoch: 15, batch: 600 // loss: 0.074\n", "epoch: 15, batch: 700 // loss: 0.078\n", "epoch: 15, batch: 800 // loss: 0.080\n", "epoch: 15, batch: 900 // loss: 0.089\n", "epoch: 15, batch: 1000 // loss: 0.073\n", "epoch: 15, batch: 1100 // loss: 0.081\n", "epoch: 15, batch: 1200 // loss: 0.079\n", "epoch: 15, batch: 1300 // loss: 0.084\n", "epoch: 15, batch: 1400 // loss: 0.077\n", "epoch: 15, batch: 1500 // loss: 0.079\n", "epoch: 15, batch: 1600 // loss: 0.085\n", "epoch: 15, batch: 1700 // loss: 0.083\n", "epoch: 15, batch: 1800 // loss: 0.085\n", "epoch: 15, batch: 1900 // loss: 0.080\n", "epoch: 15, batch: 2000 // loss: 0.075\n", "epoch: 15, batch: 2100 // loss: 0.083\n", "epoch: 15, batch: 2200 // loss: 0.089\n", "epoch: 15, batch: 2300 // loss: 0.083\n", "epoch: 15, batch: 2400 // loss: 0.077\n", "epoch: 15, batch: 2500 // loss: 0.072\n", "epoch: 15, batch: 2600 // loss: 0.084\n", "epoch: 15, batch: 2700 // loss: 0.072\n", "epoch: 15, batch: 2800 // loss: 0.089\n", "epoch: 15, batch: 2900 // loss: 0.072\n", "epoch: 15, batch: 3000 // loss: 0.076\n", "epoch: 15, batch: 3100 // loss: 0.081\n", "epoch: 15, batch: 3200 // loss: 0.075\n", "epoch: 15, batch: 3300 // loss: 0.073\n", "epoch: 15, batch: 3400 // loss: 0.071\n", "epoch: 15, batch: 3500 // loss: 0.074\n", "epoch: 15, batch: 3600 // loss: 0.082\n", "epoch: 15, batch: 3700 // loss: 0.085\n", "\n", "epoch: 16, batch: 0 // loss: 0.091\n", "epoch: 16, batch: 100 // loss: 0.077\n", "epoch: 16, batch: 200 // loss: 0.086\n", "epoch: 16, batch: 300 // loss: 0.081\n", "epoch: 16, batch: 400 // loss: 0.081\n", "epoch: 16, batch: 500 // loss: 0.072\n", "epoch: 16, batch: 600 // loss: 0.073\n", "epoch: 16, batch: 700 // loss: 0.077\n", "epoch: 16, batch: 800 // loss: 0.078\n", "epoch: 16, batch: 900 // loss: 0.087\n", "epoch: 16, batch: 1000 // loss: 0.072\n", "epoch: 16, batch: 1100 // loss: 0.080\n", "epoch: 16, batch: 1200 // loss: 0.078\n", "epoch: 16, batch: 1300 // loss: 0.083\n", "epoch: 16, batch: 1400 // loss: 0.076\n", "epoch: 16, batch: 1500 // loss: 0.078\n", "epoch: 16, batch: 1600 // loss: 0.083\n", "epoch: 16, batch: 1700 // loss: 0.081\n", "epoch: 16, batch: 1800 // loss: 0.084\n", "epoch: 16, batch: 1900 // loss: 0.079\n", "epoch: 16, batch: 2000 // loss: 0.074\n", "epoch: 16, batch: 2100 // loss: 0.082\n", "epoch: 16, batch: 2200 // loss: 0.087\n", "epoch: 16, batch: 2300 // loss: 0.082\n", "epoch: 16, batch: 2400 // loss: 0.076\n", "epoch: 16, batch: 2500 // loss: 0.071\n", "epoch: 16, batch: 2600 // loss: 0.082\n", "epoch: 16, batch: 2700 // loss: 0.071\n", "epoch: 16, batch: 2800 // loss: 0.087\n", "epoch: 16, batch: 2900 // loss: 0.071\n", "epoch: 16, batch: 3000 // loss: 0.074\n", "epoch: 16, batch: 3100 // loss: 0.079\n", "epoch: 16, batch: 3200 // loss: 0.074\n", "epoch: 16, batch: 3300 // loss: 0.072\n", "epoch: 16, batch: 3400 // loss: 0.070\n", "epoch: 16, batch: 3500 // loss: 0.072\n", "epoch: 16, batch: 3600 // loss: 0.080\n", "epoch: 16, batch: 3700 // loss: 0.083\n", "\n", "epoch: 17, batch: 0 // loss: 0.089\n", "epoch: 17, batch: 100 // loss: 0.076\n", "epoch: 17, batch: 200 // loss: 0.084\n", "epoch: 17, batch: 300 // loss: 0.079\n", "epoch: 17, batch: 400 // loss: 0.079\n", "epoch: 17, batch: 500 // loss: 0.070\n", "epoch: 17, batch: 600 // loss: 0.071\n", "epoch: 17, batch: 700 // loss: 0.075\n", "epoch: 17, batch: 800 // loss: 0.077\n", "epoch: 17, batch: 900 // loss: 0.086\n", "epoch: 17, batch: 1000 // loss: 0.071\n", "epoch: 17, batch: 1100 // loss: 0.078\n", "epoch: 17, batch: 1200 // loss: 0.076\n", "epoch: 17, batch: 1300 // loss: 0.081\n", "epoch: 17, batch: 1400 // loss: 0.075\n", "epoch: 17, batch: 1500 // loss: 0.077\n", "epoch: 17, batch: 1600 // loss: 0.082\n", "epoch: 17, batch: 1700 // loss: 0.079\n", "epoch: 17, batch: 1800 // loss: 0.082\n", "epoch: 17, batch: 1900 // loss: 0.078\n", "epoch: 17, batch: 2000 // loss: 0.073\n", "epoch: 17, batch: 2100 // loss: 0.080\n", "epoch: 17, batch: 2200 // loss: 0.085\n", "epoch: 17, batch: 2300 // loss: 0.080\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 17, batch: 2400 // loss: 0.074\n", "epoch: 17, batch: 2500 // loss: 0.069\n", "epoch: 17, batch: 2600 // loss: 0.080\n", "epoch: 17, batch: 2700 // loss: 0.069\n", "epoch: 17, batch: 2800 // loss: 0.085\n", "epoch: 17, batch: 2900 // loss: 0.069\n", "epoch: 17, batch: 3000 // loss: 0.072\n", "epoch: 17, batch: 3100 // loss: 0.077\n", "epoch: 17, batch: 3200 // loss: 0.072\n", "epoch: 17, batch: 3300 // loss: 0.070\n", "epoch: 17, batch: 3400 // loss: 0.069\n", "epoch: 17, batch: 3500 // loss: 0.070\n", "epoch: 17, batch: 3600 // loss: 0.078\n", "epoch: 17, batch: 3700 // loss: 0.082\n", "\n", "epoch: 18, batch: 0 // loss: 0.087\n", "epoch: 18, batch: 100 // loss: 0.075\n", "epoch: 18, batch: 200 // loss: 0.081\n", "epoch: 18, batch: 300 // loss: 0.078\n", "epoch: 18, batch: 400 // loss: 0.078\n", "epoch: 18, batch: 500 // loss: 0.069\n", "epoch: 18, batch: 600 // loss: 0.069\n", "epoch: 18, batch: 700 // loss: 0.073\n", "epoch: 18, batch: 800 // loss: 0.075\n", "epoch: 18, batch: 900 // loss: 0.084\n", "epoch: 18, batch: 1000 // loss: 0.070\n", "epoch: 18, batch: 1100 // loss: 0.075\n", "epoch: 18, batch: 1200 // loss: 0.075\n", "epoch: 18, batch: 1300 // loss: 0.079\n", "epoch: 18, batch: 1400 // loss: 0.073\n", "epoch: 18, batch: 1500 // loss: 0.076\n", "epoch: 18, batch: 1600 // loss: 0.080\n", "epoch: 18, batch: 1700 // loss: 0.076\n", "epoch: 18, batch: 1800 // loss: 0.081\n", "epoch: 18, batch: 1900 // loss: 0.076\n", "epoch: 18, batch: 2000 // loss: 0.072\n", "epoch: 18, batch: 2100 // loss: 0.079\n", "epoch: 18, batch: 2200 // loss: 0.083\n", "epoch: 18, batch: 2300 // loss: 0.078\n", "epoch: 18, batch: 2400 // loss: 0.073\n", "epoch: 18, batch: 2500 // loss: 0.068\n", "epoch: 18, batch: 2600 // loss: 0.078\n", "epoch: 18, batch: 2700 // loss: 0.068\n", "epoch: 18, batch: 2800 // loss: 0.083\n", "epoch: 18, batch: 2900 // loss: 0.068\n", "epoch: 18, batch: 3000 // loss: 0.070\n", "epoch: 18, batch: 3100 // loss: 0.076\n", "epoch: 18, batch: 3200 // loss: 0.071\n", "epoch: 18, batch: 3300 // loss: 0.069\n", "epoch: 18, batch: 3400 // loss: 0.068\n", "epoch: 18, batch: 3500 // loss: 0.068\n", "epoch: 18, batch: 3600 // loss: 0.076\n", "epoch: 18, batch: 3700 // loss: 0.080\n", "\n", "epoch: 19, batch: 0 // loss: 0.085\n", "epoch: 19, batch: 100 // loss: 0.073\n", "epoch: 19, batch: 200 // loss: 0.078\n", "epoch: 19, batch: 300 // loss: 0.076\n", "epoch: 19, batch: 400 // loss: 0.076\n", "epoch: 19, batch: 500 // loss: 0.067\n", "epoch: 19, batch: 600 // loss: 0.067\n", "epoch: 19, batch: 700 // loss: 0.071\n", "epoch: 19, batch: 800 // loss: 0.073\n", "epoch: 19, batch: 900 // loss: 0.082\n", "epoch: 19, batch: 1000 // loss: 0.068\n", "epoch: 19, batch: 1100 // loss: 0.073\n", "epoch: 19, batch: 1200 // loss: 0.074\n", "epoch: 19, batch: 1300 // loss: 0.077\n", "epoch: 19, batch: 1400 // loss: 0.071\n", "epoch: 19, batch: 1500 // loss: 0.074\n", "epoch: 19, batch: 1600 // loss: 0.078\n", "epoch: 19, batch: 1700 // loss: 0.074\n", "epoch: 19, batch: 1800 // loss: 0.079\n", "epoch: 19, batch: 1900 // loss: 0.075\n", "epoch: 19, batch: 2000 // loss: 0.071\n", "epoch: 19, batch: 2100 // loss: 0.077\n", "epoch: 19, batch: 2200 // loss: 0.081\n", "epoch: 19, batch: 2300 // loss: 0.076\n", "epoch: 19, batch: 2400 // loss: 0.071\n", "epoch: 19, batch: 2500 // loss: 0.067\n", "epoch: 19, batch: 2600 // loss: 0.075\n", "epoch: 19, batch: 2700 // loss: 0.067\n", "epoch: 19, batch: 2800 // loss: 0.081\n", "epoch: 19, batch: 2900 // loss: 0.067\n", "epoch: 19, batch: 3000 // loss: 0.068\n", "epoch: 19, batch: 3100 // loss: 0.074\n", "epoch: 19, batch: 3200 // loss: 0.069\n", "epoch: 19, batch: 3300 // loss: 0.067\n", "epoch: 19, batch: 3400 // loss: 0.067\n", "epoch: 19, batch: 3500 // loss: 0.065\n", "epoch: 19, batch: 3600 // loss: 0.073\n", "epoch: 19, batch: 3700 // loss: 0.077\n", "\n", "epoch: 20, batch: 0 // loss: 0.083\n", "epoch: 20, batch: 100 // loss: 0.072\n", "epoch: 20, batch: 200 // loss: 0.076\n", "epoch: 20, batch: 300 // loss: 0.075\n", "epoch: 20, batch: 400 // loss: 0.074\n", "epoch: 20, batch: 500 // loss: 0.065\n", "epoch: 20, batch: 600 // loss: 0.065\n", "epoch: 20, batch: 700 // loss: 0.069\n", "epoch: 20, batch: 800 // loss: 0.071\n", "epoch: 20, batch: 900 // loss: 0.080\n", "epoch: 20, batch: 1000 // loss: 0.067\n", "epoch: 20, batch: 1100 // loss: 0.071\n", "epoch: 20, batch: 1200 // loss: 0.072\n", "epoch: 20, batch: 1300 // loss: 0.075\n", "epoch: 20, batch: 1400 // loss: 0.069\n", "epoch: 20, batch: 1500 // loss: 0.073\n", "epoch: 20, batch: 1600 // loss: 0.077\n", "epoch: 20, batch: 1700 // loss: 0.071\n", "epoch: 20, batch: 1800 // loss: 0.077\n", "epoch: 20, batch: 1900 // loss: 0.073\n", "epoch: 20, batch: 2000 // loss: 0.070\n", "epoch: 20, batch: 2100 // loss: 0.075\n", "epoch: 20, batch: 2200 // loss: 0.079\n", "epoch: 20, batch: 2300 // loss: 0.074\n", "epoch: 20, batch: 2400 // loss: 0.069\n", "epoch: 20, batch: 2500 // loss: 0.065\n", "epoch: 20, batch: 2600 // loss: 0.073\n", "epoch: 20, batch: 2700 // loss: 0.065\n", "epoch: 20, batch: 2800 // loss: 0.079\n", "epoch: 20, batch: 2900 // loss: 0.065\n", "epoch: 20, batch: 3000 // loss: 0.066\n", "epoch: 20, batch: 3100 // loss: 0.072\n", "epoch: 20, batch: 3200 // loss: 0.067\n", "epoch: 20, batch: 3300 // loss: 0.065\n", "epoch: 20, batch: 3400 // loss: 0.066\n", "epoch: 20, batch: 3500 // loss: 0.063\n", "epoch: 20, batch: 3600 // loss: 0.071\n", "epoch: 20, batch: 3700 // loss: 0.075\n", "\n", "epoch: 21, batch: 0 // loss: 0.081\n", "epoch: 21, batch: 100 // loss: 0.071\n", "epoch: 21, batch: 200 // loss: 0.073\n", "epoch: 21, batch: 300 // loss: 0.073\n", "epoch: 21, batch: 400 // loss: 0.072\n", "epoch: 21, batch: 500 // loss: 0.063\n", "epoch: 21, batch: 600 // loss: 0.063\n", "epoch: 21, batch: 700 // loss: 0.067\n", "epoch: 21, batch: 800 // loss: 0.069\n", "epoch: 21, batch: 900 // loss: 0.078\n", "epoch: 21, batch: 1000 // loss: 0.065\n", "epoch: 21, batch: 1100 // loss: 0.068\n", "epoch: 21, batch: 1200 // loss: 0.071\n", "epoch: 21, batch: 1300 // loss: 0.074\n", "epoch: 21, batch: 1400 // loss: 0.068\n", "epoch: 21, batch: 1500 // loss: 0.072\n", "epoch: 21, batch: 1600 // loss: 0.075\n", "epoch: 21, batch: 1700 // loss: 0.069\n", "epoch: 21, batch: 1800 // loss: 0.076\n", "epoch: 21, batch: 1900 // loss: 0.071\n", "epoch: 21, batch: 2000 // loss: 0.069\n", "epoch: 21, batch: 2100 // loss: 0.074\n", "epoch: 21, batch: 2200 // loss: 0.077\n", "epoch: 21, batch: 2300 // loss: 0.072\n", "epoch: 21, batch: 2400 // loss: 0.067\n", "epoch: 21, batch: 2500 // loss: 0.064\n", "epoch: 21, batch: 2600 // loss: 0.070\n", "epoch: 21, batch: 2700 // loss: 0.064\n", "epoch: 21, batch: 2800 // loss: 0.077\n", "epoch: 21, batch: 2900 // loss: 0.064\n", "epoch: 21, batch: 3000 // loss: 0.065\n", "epoch: 21, batch: 3100 // loss: 0.070\n", "epoch: 21, batch: 3200 // loss: 0.065\n", "epoch: 21, batch: 3300 // loss: 0.063\n", "epoch: 21, batch: 3400 // loss: 0.064\n", "epoch: 21, batch: 3500 // loss: 0.061\n", "epoch: 21, batch: 3600 // loss: 0.068\n", "epoch: 21, batch: 3700 // loss: 0.073\n", "\n", "epoch: 22, batch: 0 // loss: 0.079\n", "epoch: 22, batch: 100 // loss: 0.070\n", "epoch: 22, batch: 200 // loss: 0.070\n", "epoch: 22, batch: 300 // loss: 0.072\n", "epoch: 22, batch: 400 // loss: 0.071\n", "epoch: 22, batch: 500 // loss: 0.061\n", "epoch: 22, batch: 600 // loss: 0.061\n", "epoch: 22, batch: 700 // loss: 0.065\n", "epoch: 22, batch: 800 // loss: 0.068\n", "epoch: 22, batch: 900 // loss: 0.076\n", "epoch: 22, batch: 1000 // loss: 0.064\n", "epoch: 22, batch: 1100 // loss: 0.066\n", "epoch: 22, batch: 1200 // loss: 0.069\n", "epoch: 22, batch: 1300 // loss: 0.072\n", "epoch: 22, batch: 1400 // loss: 0.066\n", "epoch: 22, batch: 1500 // loss: 0.071\n", "epoch: 22, batch: 1600 // loss: 0.073\n", "epoch: 22, batch: 1700 // loss: 0.067\n", "epoch: 22, batch: 1800 // loss: 0.074\n", "epoch: 22, batch: 1900 // loss: 0.070\n", "epoch: 22, batch: 2000 // loss: 0.069\n", "epoch: 22, batch: 2100 // loss: 0.072\n", "epoch: 22, batch: 2200 // loss: 0.075\n", "epoch: 22, batch: 2300 // loss: 0.071\n", "epoch: 22, batch: 2400 // loss: 0.066\n", "epoch: 22, batch: 2500 // loss: 0.063\n", "epoch: 22, batch: 2600 // loss: 0.068\n", "epoch: 22, batch: 2700 // loss: 0.062\n", "epoch: 22, batch: 2800 // loss: 0.076\n", "epoch: 22, batch: 2900 // loss: 0.062\n", "epoch: 22, batch: 3000 // loss: 0.063\n", "epoch: 22, batch: 3100 // loss: 0.068\n", "epoch: 22, batch: 3200 // loss: 0.064\n", "epoch: 22, batch: 3300 // loss: 0.061\n", "epoch: 22, batch: 3400 // loss: 0.063\n", "epoch: 22, batch: 3500 // loss: 0.059\n", "epoch: 22, batch: 3600 // loss: 0.066\n", "epoch: 22, batch: 3700 // loss: 0.071\n", "\n", "epoch: 23, batch: 0 // loss: 0.077\n", "epoch: 23, batch: 100 // loss: 0.069\n", "epoch: 23, batch: 200 // loss: 0.068\n", "epoch: 23, batch: 300 // loss: 0.070\n", "epoch: 23, batch: 400 // loss: 0.069\n", "epoch: 23, batch: 500 // loss: 0.059\n", "epoch: 23, batch: 600 // loss: 0.059\n", "epoch: 23, batch: 700 // loss: 0.063\n", "epoch: 23, batch: 800 // loss: 0.066\n", "epoch: 23, batch: 900 // loss: 0.074\n", "epoch: 23, batch: 1000 // loss: 0.063\n", "epoch: 23, batch: 1100 // loss: 0.064\n", "epoch: 23, batch: 1200 // loss: 0.068\n", "epoch: 23, batch: 1300 // loss: 0.070\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 23, batch: 1400 // loss: 0.064\n", "epoch: 23, batch: 1500 // loss: 0.069\n", "epoch: 23, batch: 1600 // loss: 0.072\n", "epoch: 23, batch: 1700 // loss: 0.065\n", "epoch: 23, batch: 1800 // loss: 0.073\n", "epoch: 23, batch: 1900 // loss: 0.069\n", "epoch: 23, batch: 2000 // loss: 0.068\n", "epoch: 23, batch: 2100 // loss: 0.071\n", "epoch: 23, batch: 2200 // loss: 0.073\n", "epoch: 23, batch: 2300 // loss: 0.069\n", "epoch: 23, batch: 2400 // loss: 0.064\n", "epoch: 23, batch: 2500 // loss: 0.061\n", "epoch: 23, batch: 2600 // loss: 0.066\n", "epoch: 23, batch: 2700 // loss: 0.061\n", "epoch: 23, batch: 2800 // loss: 0.074\n", "epoch: 23, batch: 2900 // loss: 0.061\n", "epoch: 23, batch: 3000 // loss: 0.061\n", "epoch: 23, batch: 3100 // loss: 0.067\n", "epoch: 23, batch: 3200 // loss: 0.062\n", "epoch: 23, batch: 3300 // loss: 0.060\n", "epoch: 23, batch: 3400 // loss: 0.062\n", "epoch: 23, batch: 3500 // loss: 0.057\n", "epoch: 23, batch: 3600 // loss: 0.064\n", "epoch: 23, batch: 3700 // loss: 0.070\n", "\n", "epoch: 24, batch: 0 // loss: 0.076\n", "epoch: 24, batch: 100 // loss: 0.068\n", "epoch: 24, batch: 200 // loss: 0.065\n", "epoch: 24, batch: 300 // loss: 0.069\n", "epoch: 24, batch: 400 // loss: 0.068\n", "epoch: 24, batch: 500 // loss: 0.058\n", "epoch: 24, batch: 600 // loss: 0.058\n", "epoch: 24, batch: 700 // loss: 0.062\n", "epoch: 24, batch: 800 // loss: 0.065\n", "epoch: 24, batch: 900 // loss: 0.072\n", "epoch: 24, batch: 1000 // loss: 0.061\n", "epoch: 24, batch: 1100 // loss: 0.062\n", "epoch: 24, batch: 1200 // loss: 0.067\n", "epoch: 24, batch: 1300 // loss: 0.069\n", "epoch: 24, batch: 1400 // loss: 0.063\n", "epoch: 24, batch: 1500 // loss: 0.068\n", "epoch: 24, batch: 1600 // loss: 0.070\n", "epoch: 24, batch: 1700 // loss: 0.063\n", "epoch: 24, batch: 1800 // loss: 0.071\n", "epoch: 24, batch: 1900 // loss: 0.067\n", "epoch: 24, batch: 2000 // loss: 0.067\n", "epoch: 24, batch: 2100 // loss: 0.070\n", "epoch: 24, batch: 2200 // loss: 0.072\n", "epoch: 24, batch: 2300 // loss: 0.068\n", "epoch: 24, batch: 2400 // loss: 0.062\n", "epoch: 24, batch: 2500 // loss: 0.060\n", "epoch: 24, batch: 2600 // loss: 0.065\n", "epoch: 24, batch: 2700 // loss: 0.060\n", "epoch: 24, batch: 2800 // loss: 0.072\n", "epoch: 24, batch: 2900 // loss: 0.060\n", "epoch: 24, batch: 3000 // loss: 0.060\n", "epoch: 24, batch: 3100 // loss: 0.065\n", "epoch: 24, batch: 3200 // loss: 0.061\n", "epoch: 24, batch: 3300 // loss: 0.059\n", "epoch: 24, batch: 3400 // loss: 0.061\n", "epoch: 24, batch: 3500 // loss: 0.056\n", "epoch: 24, batch: 3600 // loss: 0.062\n", "epoch: 24, batch: 3700 // loss: 0.068\n", "\n", "epoch: 25, batch: 0 // loss: 0.075\n", "epoch: 25, batch: 100 // loss: 0.067\n", "epoch: 25, batch: 200 // loss: 0.063\n", "epoch: 25, batch: 300 // loss: 0.068\n", "epoch: 25, batch: 400 // loss: 0.067\n", "epoch: 25, batch: 500 // loss: 0.057\n", "epoch: 25, batch: 600 // loss: 0.057\n", "epoch: 25, batch: 700 // loss: 0.060\n", "epoch: 25, batch: 800 // loss: 0.063\n", "epoch: 25, batch: 900 // loss: 0.071\n", "epoch: 25, batch: 1000 // loss: 0.060\n", "epoch: 25, batch: 1100 // loss: 0.061\n", "epoch: 25, batch: 1200 // loss: 0.066\n", "epoch: 25, batch: 1300 // loss: 0.068\n", "epoch: 25, batch: 1400 // loss: 0.061\n", "epoch: 25, batch: 1500 // loss: 0.068\n", "epoch: 25, batch: 1600 // loss: 0.069\n", "epoch: 25, batch: 1700 // loss: 0.061\n", "epoch: 25, batch: 1800 // loss: 0.070\n", "epoch: 25, batch: 1900 // loss: 0.066\n", "epoch: 25, batch: 2000 // loss: 0.066\n", "epoch: 25, batch: 2100 // loss: 0.069\n", "epoch: 25, batch: 2200 // loss: 0.071\n", "epoch: 25, batch: 2300 // loss: 0.067\n", "epoch: 25, batch: 2400 // loss: 0.061\n", "epoch: 25, batch: 2500 // loss: 0.060\n", "epoch: 25, batch: 2600 // loss: 0.063\n", "epoch: 25, batch: 2700 // loss: 0.059\n", "epoch: 25, batch: 2800 // loss: 0.071\n", "epoch: 25, batch: 2900 // loss: 0.059\n", "epoch: 25, batch: 3000 // loss: 0.059\n", "epoch: 25, batch: 3100 // loss: 0.064\n", "epoch: 25, batch: 3200 // loss: 0.059\n", "epoch: 25, batch: 3300 // loss: 0.057\n", "epoch: 25, batch: 3400 // loss: 0.061\n", "epoch: 25, batch: 3500 // loss: 0.055\n", "epoch: 25, batch: 3600 // loss: 0.060\n", "epoch: 25, batch: 3700 // loss: 0.067\n", "\n", "epoch: 26, batch: 0 // loss: 0.073\n", "epoch: 26, batch: 100 // loss: 0.067\n", "epoch: 26, batch: 200 // loss: 0.062\n", "epoch: 26, batch: 300 // loss: 0.067\n", "epoch: 26, batch: 400 // loss: 0.066\n", "epoch: 26, batch: 500 // loss: 0.055\n", "epoch: 26, batch: 600 // loss: 0.055\n", "epoch: 26, batch: 700 // loss: 0.059\n", "epoch: 26, batch: 800 // loss: 0.062\n", "epoch: 26, batch: 900 // loss: 0.070\n", "epoch: 26, batch: 1000 // loss: 0.060\n", "epoch: 26, batch: 1100 // loss: 0.060\n", "epoch: 26, batch: 1200 // loss: 0.065\n", "epoch: 26, batch: 1300 // loss: 0.067\n", "epoch: 26, batch: 1400 // loss: 0.060\n", "epoch: 26, batch: 1500 // loss: 0.067\n", "epoch: 26, batch: 1600 // loss: 0.068\n", "epoch: 26, batch: 1700 // loss: 0.060\n", "epoch: 26, batch: 1800 // loss: 0.069\n", "epoch: 26, batch: 1900 // loss: 0.065\n", "epoch: 26, batch: 2000 // loss: 0.066\n", "epoch: 26, batch: 2100 // loss: 0.068\n", "epoch: 26, batch: 2200 // loss: 0.070\n", "epoch: 26, batch: 2300 // loss: 0.066\n", "epoch: 26, batch: 2400 // loss: 0.060\n", "epoch: 26, batch: 2500 // loss: 0.059\n", "epoch: 26, batch: 2600 // loss: 0.062\n", "epoch: 26, batch: 2700 // loss: 0.058\n", "epoch: 26, batch: 2800 // loss: 0.070\n", "epoch: 26, batch: 2900 // loss: 0.058\n", "epoch: 26, batch: 3000 // loss: 0.058\n", "epoch: 26, batch: 3100 // loss: 0.063\n", "epoch: 26, batch: 3200 // loss: 0.058\n", "epoch: 26, batch: 3300 // loss: 0.056\n", "epoch: 26, batch: 3400 // loss: 0.060\n", "epoch: 26, batch: 3500 // loss: 0.053\n", "epoch: 26, batch: 3600 // loss: 0.059\n", "epoch: 26, batch: 3700 // loss: 0.066\n", "\n", "epoch: 27, batch: 0 // loss: 0.072\n", "epoch: 27, batch: 100 // loss: 0.066\n", "epoch: 27, batch: 200 // loss: 0.060\n", "epoch: 27, batch: 300 // loss: 0.066\n", "epoch: 27, batch: 400 // loss: 0.065\n", "epoch: 27, batch: 500 // loss: 0.054\n", "epoch: 27, batch: 600 // loss: 0.054\n", "epoch: 27, batch: 700 // loss: 0.058\n", "epoch: 27, batch: 800 // loss: 0.062\n", "epoch: 27, batch: 900 // loss: 0.069\n", "epoch: 27, batch: 1000 // loss: 0.059\n", "epoch: 27, batch: 1100 // loss: 0.058\n", "epoch: 27, batch: 1200 // loss: 0.064\n", "epoch: 27, batch: 1300 // loss: 0.067\n", "epoch: 27, batch: 1400 // loss: 0.059\n", "epoch: 27, batch: 1500 // loss: 0.066\n", "epoch: 27, batch: 1600 // loss: 0.067\n", "epoch: 27, batch: 1700 // loss: 0.059\n", "epoch: 27, batch: 1800 // loss: 0.069\n", "epoch: 27, batch: 1900 // loss: 0.065\n", "epoch: 27, batch: 2000 // loss: 0.065\n", "epoch: 27, batch: 2100 // loss: 0.067\n", "epoch: 27, batch: 2200 // loss: 0.069\n", "epoch: 27, batch: 2300 // loss: 0.065\n", "epoch: 27, batch: 2400 // loss: 0.059\n", "epoch: 27, batch: 2500 // loss: 0.058\n", "epoch: 27, batch: 2600 // loss: 0.061\n", "epoch: 27, batch: 2700 // loss: 0.058\n", "epoch: 27, batch: 2800 // loss: 0.069\n", "epoch: 27, batch: 2900 // loss: 0.058\n", "epoch: 27, batch: 3000 // loss: 0.057\n", "epoch: 27, batch: 3100 // loss: 0.062\n", "epoch: 27, batch: 3200 // loss: 0.057\n", "epoch: 27, batch: 3300 // loss: 0.056\n", "epoch: 27, batch: 3400 // loss: 0.059\n", "epoch: 27, batch: 3500 // loss: 0.053\n", "epoch: 27, batch: 3600 // loss: 0.058\n", "epoch: 27, batch: 3700 // loss: 0.065\n", "\n", "epoch: 28, batch: 0 // loss: 0.071\n", "epoch: 28, batch: 100 // loss: 0.066\n", "epoch: 28, batch: 200 // loss: 0.059\n", "epoch: 28, batch: 300 // loss: 0.066\n", "epoch: 28, batch: 400 // loss: 0.064\n", "epoch: 28, batch: 500 // loss: 0.054\n", "epoch: 28, batch: 600 // loss: 0.054\n", "epoch: 28, batch: 700 // loss: 0.057\n", "epoch: 28, batch: 800 // loss: 0.061\n", "epoch: 28, batch: 900 // loss: 0.068\n", "epoch: 28, batch: 1000 // loss: 0.058\n", "epoch: 28, batch: 1100 // loss: 0.058\n", "epoch: 28, batch: 1200 // loss: 0.063\n", "epoch: 28, batch: 1300 // loss: 0.066\n", "epoch: 28, batch: 1400 // loss: 0.059\n", "epoch: 28, batch: 1500 // loss: 0.065\n", "epoch: 28, batch: 1600 // loss: 0.066\n", "epoch: 28, batch: 1700 // loss: 0.059\n", "epoch: 28, batch: 1800 // loss: 0.068\n", "epoch: 28, batch: 1900 // loss: 0.064\n", "epoch: 28, batch: 2000 // loss: 0.065\n", "epoch: 28, batch: 2100 // loss: 0.066\n", "epoch: 28, batch: 2200 // loss: 0.068\n", "epoch: 28, batch: 2300 // loss: 0.065\n", "epoch: 28, batch: 2400 // loss: 0.058\n", "epoch: 28, batch: 2500 // loss: 0.058\n", "epoch: 28, batch: 2600 // loss: 0.060\n", "epoch: 28, batch: 2700 // loss: 0.057\n", "epoch: 28, batch: 2800 // loss: 0.068\n", "epoch: 28, batch: 2900 // loss: 0.057\n", "epoch: 28, batch: 3000 // loss: 0.056\n", "epoch: 28, batch: 3100 // loss: 0.061\n", "epoch: 28, batch: 3200 // loss: 0.056\n", "epoch: 28, batch: 3300 // loss: 0.055\n", "epoch: 28, batch: 3400 // loss: 0.059\n", "epoch: 28, batch: 3500 // loss: 0.052\n", "epoch: 28, batch: 3600 // loss: 0.057\n", "epoch: 28, batch: 3700 // loss: 0.064\n", "\n", "epoch: 29, batch: 0 // loss: 0.071\n", "epoch: 29, batch: 100 // loss: 0.065\n", "epoch: 29, batch: 200 // loss: 0.058\n", "epoch: 29, batch: 300 // loss: 0.065\n", "epoch: 29, batch: 400 // loss: 0.063\n", "epoch: 29, batch: 500 // loss: 0.053\n", "epoch: 29, batch: 600 // loss: 0.053\n", "epoch: 29, batch: 700 // loss: 0.056\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 29, batch: 800 // loss: 0.060\n", "epoch: 29, batch: 900 // loss: 0.068\n", "epoch: 29, batch: 1000 // loss: 0.058\n", "epoch: 29, batch: 1100 // loss: 0.057\n", "epoch: 29, batch: 1200 // loss: 0.063\n", "epoch: 29, batch: 1300 // loss: 0.066\n", "epoch: 29, batch: 1400 // loss: 0.058\n", "epoch: 29, batch: 1500 // loss: 0.065\n", "epoch: 29, batch: 1600 // loss: 0.066\n", "epoch: 29, batch: 1700 // loss: 0.058\n", "epoch: 29, batch: 1800 // loss: 0.067\n", "epoch: 29, batch: 1900 // loss: 0.063\n", "epoch: 29, batch: 2000 // loss: 0.064\n", "epoch: 29, batch: 2100 // loss: 0.066\n", "epoch: 29, batch: 2200 // loss: 0.068\n", "epoch: 29, batch: 2300 // loss: 0.064\n", "epoch: 29, batch: 2400 // loss: 0.057\n", "epoch: 29, batch: 2500 // loss: 0.057\n", "epoch: 29, batch: 2600 // loss: 0.059\n", "epoch: 29, batch: 2700 // loss: 0.057\n", "epoch: 29, batch: 2800 // loss: 0.068\n", "epoch: 29, batch: 2900 // loss: 0.057\n", "epoch: 29, batch: 3000 // loss: 0.056\n", "epoch: 29, batch: 3100 // loss: 0.061\n", "epoch: 29, batch: 3200 // loss: 0.056\n", "epoch: 29, batch: 3300 // loss: 0.054\n", "epoch: 29, batch: 3400 // loss: 0.059\n", "epoch: 29, batch: 3500 // loss: 0.051\n", "epoch: 29, batch: 3600 // loss: 0.056\n", "epoch: 29, batch: 3700 // loss: 0.063\n", "\n", "epoch: 30, batch: 0 // loss: 0.070\n", "epoch: 30, batch: 100 // loss: 0.065\n", "epoch: 30, batch: 200 // loss: 0.058\n", "epoch: 30, batch: 300 // loss: 0.065\n", "epoch: 30, batch: 400 // loss: 0.063\n", "epoch: 30, batch: 500 // loss: 0.052\n", "epoch: 30, batch: 600 // loss: 0.052\n", "epoch: 30, batch: 700 // loss: 0.056\n", "epoch: 30, batch: 800 // loss: 0.060\n", "epoch: 30, batch: 900 // loss: 0.067\n", "epoch: 30, batch: 1000 // loss: 0.057\n", "epoch: 30, batch: 1100 // loss: 0.056\n", "epoch: 30, batch: 1200 // loss: 0.062\n", "epoch: 30, batch: 1300 // loss: 0.065\n", "epoch: 30, batch: 1400 // loss: 0.057\n", "epoch: 30, batch: 1500 // loss: 0.064\n", "epoch: 30, batch: 1600 // loss: 0.065\n", "epoch: 30, batch: 1700 // loss: 0.058\n", "epoch: 30, batch: 1800 // loss: 0.067\n", "epoch: 30, batch: 1900 // loss: 0.063\n", "epoch: 30, batch: 2000 // loss: 0.064\n", "epoch: 30, batch: 2100 // loss: 0.065\n", "epoch: 30, batch: 2200 // loss: 0.067\n", "epoch: 30, batch: 2300 // loss: 0.064\n", "epoch: 30, batch: 2400 // loss: 0.056\n", "epoch: 30, batch: 2500 // loss: 0.057\n", "epoch: 30, batch: 2600 // loss: 0.058\n", "epoch: 30, batch: 2700 // loss: 0.056\n", "epoch: 30, batch: 2800 // loss: 0.067\n", "epoch: 30, batch: 2900 // loss: 0.056\n", "epoch: 30, batch: 3000 // loss: 0.055\n", "epoch: 30, batch: 3100 // loss: 0.060\n", "epoch: 30, batch: 3200 // loss: 0.055\n", "epoch: 30, batch: 3300 // loss: 0.054\n", "epoch: 30, batch: 3400 // loss: 0.058\n", "epoch: 30, batch: 3500 // loss: 0.051\n", "epoch: 30, batch: 3600 // loss: 0.055\n", "epoch: 30, batch: 3700 // loss: 0.063\n", "\n", "epoch: 31, batch: 0 // loss: 0.070\n", "epoch: 31, batch: 100 // loss: 0.065\n", "epoch: 31, batch: 200 // loss: 0.057\n", "epoch: 31, batch: 300 // loss: 0.064\n", "epoch: 31, batch: 400 // loss: 0.062\n", "epoch: 31, batch: 500 // loss: 0.052\n", "epoch: 31, batch: 600 // loss: 0.052\n", "epoch: 31, batch: 700 // loss: 0.055\n", "epoch: 31, batch: 800 // loss: 0.059\n", "epoch: 31, batch: 900 // loss: 0.066\n", "epoch: 31, batch: 1000 // loss: 0.057\n", "epoch: 31, batch: 1100 // loss: 0.056\n", "epoch: 31, batch: 1200 // loss: 0.062\n", "epoch: 31, batch: 1300 // loss: 0.065\n", "epoch: 31, batch: 1400 // loss: 0.057\n", "epoch: 31, batch: 1500 // loss: 0.064\n", "epoch: 31, batch: 1600 // loss: 0.064\n", "epoch: 31, batch: 1700 // loss: 0.057\n", "epoch: 31, batch: 1800 // loss: 0.067\n", "epoch: 31, batch: 1900 // loss: 0.062\n", "epoch: 31, batch: 2000 // loss: 0.064\n", "epoch: 31, batch: 2100 // loss: 0.065\n", "epoch: 31, batch: 2200 // loss: 0.067\n", "epoch: 31, batch: 2300 // loss: 0.063\n", "epoch: 31, batch: 2400 // loss: 0.056\n", "epoch: 31, batch: 2500 // loss: 0.056\n", "epoch: 31, batch: 2600 // loss: 0.058\n", "epoch: 31, batch: 2700 // loss: 0.056\n", "epoch: 31, batch: 2800 // loss: 0.067\n", "epoch: 31, batch: 2900 // loss: 0.056\n", "epoch: 31, batch: 3000 // loss: 0.055\n", "epoch: 31, batch: 3100 // loss: 0.059\n", "epoch: 31, batch: 3200 // loss: 0.054\n", "epoch: 31, batch: 3300 // loss: 0.053\n", "epoch: 31, batch: 3400 // loss: 0.058\n", "epoch: 31, batch: 3500 // loss: 0.050\n", "epoch: 31, batch: 3600 // loss: 0.055\n", "epoch: 31, batch: 3700 // loss: 0.062\n", "\n", "epoch: 32, batch: 0 // loss: 0.069\n", "epoch: 32, batch: 100 // loss: 0.065\n", "epoch: 32, batch: 200 // loss: 0.056\n", "epoch: 32, batch: 300 // loss: 0.064\n", "epoch: 32, batch: 400 // loss: 0.062\n", "epoch: 32, batch: 500 // loss: 0.051\n", "epoch: 32, batch: 600 // loss: 0.052\n", "epoch: 32, batch: 700 // loss: 0.055\n", "epoch: 32, batch: 800 // loss: 0.059\n", "epoch: 32, batch: 900 // loss: 0.066\n", "epoch: 32, batch: 1000 // loss: 0.056\n", "epoch: 32, batch: 1100 // loss: 0.055\n", "epoch: 32, batch: 1200 // loss: 0.061\n", "epoch: 32, batch: 1300 // loss: 0.065\n", "epoch: 32, batch: 1400 // loss: 0.056\n", "epoch: 32, batch: 1500 // loss: 0.063\n", "epoch: 32, batch: 1600 // loss: 0.064\n", "epoch: 32, batch: 1700 // loss: 0.057\n", "epoch: 32, batch: 1800 // loss: 0.066\n", "epoch: 32, batch: 1900 // loss: 0.062\n", "epoch: 32, batch: 2000 // loss: 0.063\n", "epoch: 32, batch: 2100 // loss: 0.064\n", "epoch: 32, batch: 2200 // loss: 0.067\n", "epoch: 32, batch: 2300 // loss: 0.063\n", "epoch: 32, batch: 2400 // loss: 0.055\n", "epoch: 32, batch: 2500 // loss: 0.056\n", "epoch: 32, batch: 2600 // loss: 0.057\n", "epoch: 32, batch: 2700 // loss: 0.056\n", "epoch: 32, batch: 2800 // loss: 0.066\n", "epoch: 32, batch: 2900 // loss: 0.055\n", "epoch: 32, batch: 3000 // loss: 0.055\n", "epoch: 32, batch: 3100 // loss: 0.059\n", "epoch: 32, batch: 3200 // loss: 0.054\n", "epoch: 32, batch: 3300 // loss: 0.053\n", "epoch: 32, batch: 3400 // loss: 0.057\n", "epoch: 32, batch: 3500 // loss: 0.050\n", "epoch: 32, batch: 3600 // loss: 0.054\n", "epoch: 32, batch: 3700 // loss: 0.061\n", "\n", "epoch: 33, batch: 0 // loss: 0.069\n", "epoch: 33, batch: 100 // loss: 0.064\n", "epoch: 33, batch: 200 // loss: 0.056\n", "epoch: 33, batch: 300 // loss: 0.063\n", "epoch: 33, batch: 400 // loss: 0.061\n", "epoch: 33, batch: 500 // loss: 0.051\n", "epoch: 33, batch: 600 // loss: 0.051\n", "epoch: 33, batch: 700 // loss: 0.054\n", "epoch: 33, batch: 800 // loss: 0.059\n", "epoch: 33, batch: 900 // loss: 0.065\n", "epoch: 33, batch: 1000 // loss: 0.056\n", "epoch: 33, batch: 1100 // loss: 0.055\n", "epoch: 33, batch: 1200 // loss: 0.061\n", "epoch: 33, batch: 1300 // loss: 0.064\n", "epoch: 33, batch: 1400 // loss: 0.056\n", "epoch: 33, batch: 1500 // loss: 0.063\n", "epoch: 33, batch: 1600 // loss: 0.064\n", "epoch: 33, batch: 1700 // loss: 0.056\n", "epoch: 33, batch: 1800 // loss: 0.066\n", "epoch: 33, batch: 1900 // loss: 0.062\n", "epoch: 33, batch: 2000 // loss: 0.063\n", "epoch: 33, batch: 2100 // loss: 0.064\n", "epoch: 33, batch: 2200 // loss: 0.066\n", "epoch: 33, batch: 2300 // loss: 0.063\n", "epoch: 33, batch: 2400 // loss: 0.055\n", "epoch: 33, batch: 2500 // loss: 0.056\n", "epoch: 33, batch: 2600 // loss: 0.057\n", "epoch: 33, batch: 2700 // loss: 0.055\n", "epoch: 33, batch: 2800 // loss: 0.065\n", "epoch: 33, batch: 2900 // loss: 0.055\n", "epoch: 33, batch: 3000 // loss: 0.054\n", "epoch: 33, batch: 3100 // loss: 0.058\n", "epoch: 33, batch: 3200 // loss: 0.053\n", "epoch: 33, batch: 3300 // loss: 0.052\n", "epoch: 33, batch: 3400 // loss: 0.057\n", "epoch: 33, batch: 3500 // loss: 0.049\n", "epoch: 33, batch: 3600 // loss: 0.054\n", "epoch: 33, batch: 3700 // loss: 0.061\n", "\n", "epoch: 34, batch: 0 // loss: 0.068\n", "epoch: 34, batch: 100 // loss: 0.064\n", "epoch: 34, batch: 200 // loss: 0.055\n", "epoch: 34, batch: 300 // loss: 0.063\n", "epoch: 34, batch: 400 // loss: 0.061\n", "epoch: 34, batch: 500 // loss: 0.050\n", "epoch: 34, batch: 600 // loss: 0.051\n", "epoch: 34, batch: 700 // loss: 0.054\n", "epoch: 34, batch: 800 // loss: 0.058\n", "epoch: 34, batch: 900 // loss: 0.065\n", "epoch: 34, batch: 1000 // loss: 0.055\n", "epoch: 34, batch: 1100 // loss: 0.054\n", "epoch: 34, batch: 1200 // loss: 0.060\n", "epoch: 34, batch: 1300 // loss: 0.064\n", "epoch: 34, batch: 1400 // loss: 0.055\n", "epoch: 34, batch: 1500 // loss: 0.062\n", "epoch: 34, batch: 1600 // loss: 0.063\n", "epoch: 34, batch: 1700 // loss: 0.056\n", "epoch: 34, batch: 1800 // loss: 0.065\n", "epoch: 34, batch: 1900 // loss: 0.061\n", "epoch: 34, batch: 2000 // loss: 0.062\n", "epoch: 34, batch: 2100 // loss: 0.063\n", "epoch: 34, batch: 2200 // loss: 0.066\n", "epoch: 34, batch: 2300 // loss: 0.062\n", "epoch: 34, batch: 2400 // loss: 0.054\n", "epoch: 34, batch: 2500 // loss: 0.055\n", "epoch: 34, batch: 2600 // loss: 0.057\n", "epoch: 34, batch: 2700 // loss: 0.055\n", "epoch: 34, batch: 2800 // loss: 0.065\n", "epoch: 34, batch: 2900 // loss: 0.054\n", "epoch: 34, batch: 3000 // loss: 0.054\n", "epoch: 34, batch: 3100 // loss: 0.058\n", "epoch: 34, batch: 3200 // loss: 0.053\n", "epoch: 34, batch: 3300 // loss: 0.052\n", "epoch: 34, batch: 3400 // loss: 0.057\n", "epoch: 34, batch: 3500 // loss: 0.049\n", "epoch: 34, batch: 3600 // loss: 0.053\n", "epoch: 34, batch: 3700 // loss: 0.060\n", "\n", "epoch: 35, batch: 0 // loss: 0.068\n", "epoch: 35, batch: 100 // loss: 0.064\n", "epoch: 35, batch: 200 // loss: 0.055\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 35, batch: 300 // loss: 0.062\n", "epoch: 35, batch: 400 // loss: 0.061\n", "epoch: 35, batch: 500 // loss: 0.050\n", "epoch: 35, batch: 600 // loss: 0.050\n", "epoch: 35, batch: 700 // loss: 0.054\n", "epoch: 35, batch: 800 // loss: 0.058\n", "epoch: 35, batch: 900 // loss: 0.064\n", "epoch: 35, batch: 1000 // loss: 0.055\n", "epoch: 35, batch: 1100 // loss: 0.054\n", "epoch: 35, batch: 1200 // loss: 0.060\n", "epoch: 35, batch: 1300 // loss: 0.063\n", "epoch: 35, batch: 1400 // loss: 0.055\n", "epoch: 35, batch: 1500 // loss: 0.062\n", "epoch: 35, batch: 1600 // loss: 0.063\n", "epoch: 35, batch: 1700 // loss: 0.056\n", "epoch: 35, batch: 1800 // loss: 0.065\n", "epoch: 35, batch: 1900 // loss: 0.061\n", "epoch: 35, batch: 2000 // loss: 0.062\n", "epoch: 35, batch: 2100 // loss: 0.063\n", "epoch: 35, batch: 2200 // loss: 0.065\n", "epoch: 35, batch: 2300 // loss: 0.062\n", "epoch: 35, batch: 2400 // loss: 0.054\n", "epoch: 35, batch: 2500 // loss: 0.055\n", "epoch: 35, batch: 2600 // loss: 0.056\n", "epoch: 35, batch: 2700 // loss: 0.054\n", "epoch: 35, batch: 2800 // loss: 0.064\n", "epoch: 35, batch: 2900 // loss: 0.054\n", "epoch: 35, batch: 3000 // loss: 0.054\n", "epoch: 35, batch: 3100 // loss: 0.057\n", "epoch: 35, batch: 3200 // loss: 0.052\n", "epoch: 35, batch: 3300 // loss: 0.051\n", "epoch: 35, batch: 3400 // loss: 0.056\n", "epoch: 35, batch: 3500 // loss: 0.048\n", "epoch: 35, batch: 3600 // loss: 0.053\n", "epoch: 35, batch: 3700 // loss: 0.060\n", "\n", "epoch: 36, batch: 0 // loss: 0.067\n", "epoch: 36, batch: 100 // loss: 0.063\n", "epoch: 36, batch: 200 // loss: 0.054\n", "epoch: 36, batch: 300 // loss: 0.062\n", "epoch: 36, batch: 400 // loss: 0.060\n", "epoch: 36, batch: 500 // loss: 0.050\n", "epoch: 36, batch: 600 // loss: 0.050\n", "epoch: 36, batch: 700 // loss: 0.053\n", "epoch: 36, batch: 800 // loss: 0.057\n", "epoch: 36, batch: 900 // loss: 0.064\n", "epoch: 36, batch: 1000 // loss: 0.055\n", "epoch: 36, batch: 1100 // loss: 0.054\n", "epoch: 36, batch: 1200 // loss: 0.059\n", "epoch: 36, batch: 1300 // loss: 0.063\n", "epoch: 36, batch: 1400 // loss: 0.054\n", "epoch: 36, batch: 1500 // loss: 0.061\n", "epoch: 36, batch: 1600 // loss: 0.062\n", "epoch: 36, batch: 1700 // loss: 0.056\n", "epoch: 36, batch: 1800 // loss: 0.064\n", "epoch: 36, batch: 1900 // loss: 0.060\n", "epoch: 36, batch: 2000 // loss: 0.061\n", "epoch: 36, batch: 2100 // loss: 0.062\n", "epoch: 36, batch: 2200 // loss: 0.065\n", "epoch: 36, batch: 2300 // loss: 0.062\n", "epoch: 36, batch: 2400 // loss: 0.053\n", "epoch: 36, batch: 2500 // loss: 0.055\n", "epoch: 36, batch: 2600 // loss: 0.056\n", "epoch: 36, batch: 2700 // loss: 0.054\n", "epoch: 36, batch: 2800 // loss: 0.064\n", "epoch: 36, batch: 2900 // loss: 0.054\n", "epoch: 36, batch: 3000 // loss: 0.053\n", "epoch: 36, batch: 3100 // loss: 0.057\n", "epoch: 36, batch: 3200 // loss: 0.051\n", "epoch: 36, batch: 3300 // loss: 0.051\n", "epoch: 36, batch: 3400 // loss: 0.056\n", "epoch: 36, batch: 3500 // loss: 0.048\n", "epoch: 36, batch: 3600 // loss: 0.053\n", "epoch: 36, batch: 3700 // loss: 0.059\n", "\n", "epoch: 37, batch: 0 // loss: 0.067\n", "epoch: 37, batch: 100 // loss: 0.063\n", "epoch: 37, batch: 200 // loss: 0.054\n", "epoch: 37, batch: 300 // loss: 0.061\n", "epoch: 37, batch: 400 // loss: 0.060\n", "epoch: 37, batch: 500 // loss: 0.049\n", "epoch: 37, batch: 600 // loss: 0.050\n", "epoch: 37, batch: 700 // loss: 0.053\n", "epoch: 37, batch: 800 // loss: 0.057\n", "epoch: 37, batch: 900 // loss: 0.063\n", "epoch: 37, batch: 1000 // loss: 0.054\n", "epoch: 37, batch: 1100 // loss: 0.053\n", "epoch: 37, batch: 1200 // loss: 0.058\n", "epoch: 37, batch: 1300 // loss: 0.062\n", "epoch: 37, batch: 1400 // loss: 0.054\n", "epoch: 37, batch: 1500 // loss: 0.061\n", "epoch: 37, batch: 1600 // loss: 0.062\n", "epoch: 37, batch: 1700 // loss: 0.055\n", "epoch: 37, batch: 1800 // loss: 0.064\n", "epoch: 37, batch: 1900 // loss: 0.060\n", "epoch: 37, batch: 2000 // loss: 0.061\n", "epoch: 37, batch: 2100 // loss: 0.062\n", "epoch: 37, batch: 2200 // loss: 0.065\n", "epoch: 37, batch: 2300 // loss: 0.061\n", "epoch: 37, batch: 2400 // loss: 0.052\n", "epoch: 37, batch: 2500 // loss: 0.054\n", "epoch: 37, batch: 2600 // loss: 0.055\n", "epoch: 37, batch: 2700 // loss: 0.054\n", "epoch: 37, batch: 2800 // loss: 0.063\n", "epoch: 37, batch: 2900 // loss: 0.053\n", "epoch: 37, batch: 3000 // loss: 0.053\n", "epoch: 37, batch: 3100 // loss: 0.056\n", "epoch: 37, batch: 3200 // loss: 0.051\n", "epoch: 37, batch: 3300 // loss: 0.050\n", "epoch: 37, batch: 3400 // loss: 0.055\n", "epoch: 37, batch: 3500 // loss: 0.047\n", "epoch: 37, batch: 3600 // loss: 0.052\n", "epoch: 37, batch: 3700 // loss: 0.058\n", "\n", "epoch: 38, batch: 0 // loss: 0.066\n", "epoch: 38, batch: 100 // loss: 0.062\n", "epoch: 38, batch: 200 // loss: 0.053\n", "epoch: 38, batch: 300 // loss: 0.061\n", "epoch: 38, batch: 400 // loss: 0.059\n", "epoch: 38, batch: 500 // loss: 0.049\n", "epoch: 38, batch: 600 // loss: 0.049\n", "epoch: 38, batch: 700 // loss: 0.052\n", "epoch: 38, batch: 800 // loss: 0.056\n", "epoch: 38, batch: 900 // loss: 0.063\n", "epoch: 38, batch: 1000 // loss: 0.054\n", "epoch: 38, batch: 1100 // loss: 0.053\n", "epoch: 38, batch: 1200 // loss: 0.058\n", "epoch: 38, batch: 1300 // loss: 0.062\n", "epoch: 38, batch: 1400 // loss: 0.053\n", "epoch: 38, batch: 1500 // loss: 0.060\n", "epoch: 38, batch: 1600 // loss: 0.061\n", "epoch: 38, batch: 1700 // loss: 0.055\n", "epoch: 38, batch: 1800 // loss: 0.063\n", "epoch: 38, batch: 1900 // loss: 0.059\n", "epoch: 38, batch: 2000 // loss: 0.060\n", "epoch: 38, batch: 2100 // loss: 0.061\n", "epoch: 38, batch: 2200 // loss: 0.064\n", "epoch: 38, batch: 2300 // loss: 0.061\n", "epoch: 38, batch: 2400 // loss: 0.052\n", "epoch: 38, batch: 2500 // loss: 0.054\n", "epoch: 38, batch: 2600 // loss: 0.055\n", "epoch: 38, batch: 2700 // loss: 0.053\n", "epoch: 38, batch: 2800 // loss: 0.062\n", "epoch: 38, batch: 2900 // loss: 0.053\n", "epoch: 38, batch: 3000 // loss: 0.053\n", "epoch: 38, batch: 3100 // loss: 0.056\n", "epoch: 38, batch: 3200 // loss: 0.050\n", "epoch: 38, batch: 3300 // loss: 0.050\n", "epoch: 38, batch: 3400 // loss: 0.055\n", "epoch: 38, batch: 3500 // loss: 0.047\n", "epoch: 38, batch: 3600 // loss: 0.052\n", "epoch: 38, batch: 3700 // loss: 0.058\n", "\n", "epoch: 39, batch: 0 // loss: 0.066\n", "epoch: 39, batch: 100 // loss: 0.062\n", "epoch: 39, batch: 200 // loss: 0.053\n", "epoch: 39, batch: 300 // loss: 0.060\n", "epoch: 39, batch: 400 // loss: 0.059\n", "epoch: 39, batch: 500 // loss: 0.048\n", "epoch: 39, batch: 600 // loss: 0.049\n", "epoch: 39, batch: 700 // loss: 0.052\n", "epoch: 39, batch: 800 // loss: 0.056\n", "epoch: 39, batch: 900 // loss: 0.062\n", "epoch: 39, batch: 1000 // loss: 0.053\n", "epoch: 39, batch: 1100 // loss: 0.052\n", "epoch: 39, batch: 1200 // loss: 0.057\n", "epoch: 39, batch: 1300 // loss: 0.061\n", "epoch: 39, batch: 1400 // loss: 0.053\n", "epoch: 39, batch: 1500 // loss: 0.060\n", "epoch: 39, batch: 1600 // loss: 0.061\n", "epoch: 39, batch: 1700 // loss: 0.055\n", "epoch: 39, batch: 1800 // loss: 0.063\n", "epoch: 39, batch: 1900 // loss: 0.058\n", "epoch: 39, batch: 2000 // loss: 0.060\n", "epoch: 39, batch: 2100 // loss: 0.060\n", "epoch: 39, batch: 2200 // loss: 0.063\n", "epoch: 39, batch: 2300 // loss: 0.060\n", "epoch: 39, batch: 2400 // loss: 0.051\n", "epoch: 39, batch: 2500 // loss: 0.053\n", "epoch: 39, batch: 2600 // loss: 0.054\n", "epoch: 39, batch: 2700 // loss: 0.053\n", "epoch: 39, batch: 2800 // loss: 0.061\n", "epoch: 39, batch: 2900 // loss: 0.052\n", "epoch: 39, batch: 3000 // loss: 0.052\n", "epoch: 39, batch: 3100 // loss: 0.055\n", "epoch: 39, batch: 3200 // loss: 0.050\n", "epoch: 39, batch: 3300 // loss: 0.049\n", "epoch: 39, batch: 3400 // loss: 0.054\n", "epoch: 39, batch: 3500 // loss: 0.046\n", "epoch: 39, batch: 3600 // loss: 0.051\n", "epoch: 39, batch: 3700 // loss: 0.057\n", "\n", "epoch: 40, batch: 0 // loss: 0.065\n", "epoch: 40, batch: 100 // loss: 0.061\n", "epoch: 40, batch: 200 // loss: 0.052\n", "epoch: 40, batch: 300 // loss: 0.060\n", "epoch: 40, batch: 400 // loss: 0.058\n", "epoch: 40, batch: 500 // loss: 0.048\n", "epoch: 40, batch: 600 // loss: 0.048\n", "epoch: 40, batch: 700 // loss: 0.052\n", "epoch: 40, batch: 800 // loss: 0.055\n", "epoch: 40, batch: 900 // loss: 0.061\n", "epoch: 40, batch: 1000 // loss: 0.053\n", "epoch: 40, batch: 1100 // loss: 0.052\n", "epoch: 40, batch: 1200 // loss: 0.056\n", "epoch: 40, batch: 1300 // loss: 0.060\n", "epoch: 40, batch: 1400 // loss: 0.052\n", "epoch: 40, batch: 1500 // loss: 0.059\n", "epoch: 40, batch: 1600 // loss: 0.060\n", "epoch: 40, batch: 1700 // loss: 0.054\n", "epoch: 40, batch: 1800 // loss: 0.062\n", "epoch: 40, batch: 1900 // loss: 0.058\n", "epoch: 40, batch: 2000 // loss: 0.059\n", "epoch: 40, batch: 2100 // loss: 0.060\n", "epoch: 40, batch: 2200 // loss: 0.063\n", "epoch: 40, batch: 2300 // loss: 0.060\n", "epoch: 40, batch: 2400 // loss: 0.051\n", "epoch: 40, batch: 2500 // loss: 0.053\n", "epoch: 40, batch: 2600 // loss: 0.054\n", "epoch: 40, batch: 2700 // loss: 0.052\n", "epoch: 40, batch: 2800 // loss: 0.060\n", "epoch: 40, batch: 2900 // loss: 0.052\n", "epoch: 40, batch: 3000 // loss: 0.052\n", "epoch: 40, batch: 3100 // loss: 0.054\n", "epoch: 40, batch: 3200 // loss: 0.049\n", "epoch: 40, batch: 3300 // loss: 0.048\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 40, batch: 3400 // loss: 0.054\n", "epoch: 40, batch: 3500 // loss: 0.046\n", "epoch: 40, batch: 3600 // loss: 0.051\n", "epoch: 40, batch: 3700 // loss: 0.056\n", "\n", "epoch: 41, batch: 0 // loss: 0.065\n", "epoch: 41, batch: 100 // loss: 0.060\n", "epoch: 41, batch: 200 // loss: 0.052\n", "epoch: 41, batch: 300 // loss: 0.059\n", "epoch: 41, batch: 400 // loss: 0.057\n", "epoch: 41, batch: 500 // loss: 0.047\n", "epoch: 41, batch: 600 // loss: 0.048\n", "epoch: 41, batch: 700 // loss: 0.051\n", "epoch: 41, batch: 800 // loss: 0.054\n", "epoch: 41, batch: 900 // loss: 0.061\n", "epoch: 41, batch: 1000 // loss: 0.052\n", "epoch: 41, batch: 1100 // loss: 0.051\n", "epoch: 41, batch: 1200 // loss: 0.056\n", "epoch: 41, batch: 1300 // loss: 0.060\n", "epoch: 41, batch: 1400 // loss: 0.051\n", "epoch: 41, batch: 1500 // loss: 0.058\n", "epoch: 41, batch: 1600 // loss: 0.060\n", "epoch: 41, batch: 1700 // loss: 0.054\n", "epoch: 41, batch: 1800 // loss: 0.062\n", "epoch: 41, batch: 1900 // loss: 0.057\n", "epoch: 41, batch: 2000 // loss: 0.058\n", "epoch: 41, batch: 2100 // loss: 0.059\n", "epoch: 41, batch: 2200 // loss: 0.062\n", "epoch: 41, batch: 2300 // loss: 0.059\n", "epoch: 41, batch: 2400 // loss: 0.050\n", "epoch: 41, batch: 2500 // loss: 0.052\n", "epoch: 41, batch: 2600 // loss: 0.053\n", "epoch: 41, batch: 2700 // loss: 0.051\n", "epoch: 41, batch: 2800 // loss: 0.060\n", "epoch: 41, batch: 2900 // loss: 0.051\n", "epoch: 41, batch: 3000 // loss: 0.052\n", "epoch: 41, batch: 3100 // loss: 0.054\n", "epoch: 41, batch: 3200 // loss: 0.048\n", "epoch: 41, batch: 3300 // loss: 0.048\n", "epoch: 41, batch: 3400 // loss: 0.053\n", "epoch: 41, batch: 3500 // loss: 0.045\n", "epoch: 41, batch: 3600 // loss: 0.050\n", "epoch: 41, batch: 3700 // loss: 0.055\n", "\n", "epoch: 42, batch: 0 // loss: 0.064\n", "epoch: 42, batch: 100 // loss: 0.060\n", "epoch: 42, batch: 200 // loss: 0.051\n", "epoch: 42, batch: 300 // loss: 0.058\n", "epoch: 42, batch: 400 // loss: 0.057\n", "epoch: 42, batch: 500 // loss: 0.047\n", "epoch: 42, batch: 600 // loss: 0.048\n", "epoch: 42, batch: 700 // loss: 0.051\n", "epoch: 42, batch: 800 // loss: 0.053\n", "epoch: 42, batch: 900 // loss: 0.060\n", "epoch: 42, batch: 1000 // loss: 0.052\n", "epoch: 42, batch: 1100 // loss: 0.051\n", "epoch: 42, batch: 1200 // loss: 0.055\n", "epoch: 42, batch: 1300 // loss: 0.059\n", "epoch: 42, batch: 1400 // loss: 0.051\n", "epoch: 42, batch: 1500 // loss: 0.058\n", "epoch: 42, batch: 1600 // loss: 0.059\n", "epoch: 42, batch: 1700 // loss: 0.053\n", "epoch: 42, batch: 1800 // loss: 0.061\n", "epoch: 42, batch: 1900 // loss: 0.056\n", "epoch: 42, batch: 2000 // loss: 0.057\n", "epoch: 42, batch: 2100 // loss: 0.058\n", "epoch: 42, batch: 2200 // loss: 0.061\n", "epoch: 42, batch: 2300 // loss: 0.059\n", "epoch: 42, batch: 2400 // loss: 0.050\n", "epoch: 42, batch: 2500 // loss: 0.052\n", "epoch: 42, batch: 2600 // loss: 0.053\n", "epoch: 42, batch: 2700 // loss: 0.051\n", "epoch: 42, batch: 2800 // loss: 0.059\n", "epoch: 42, batch: 2900 // loss: 0.050\n", "epoch: 42, batch: 3000 // loss: 0.051\n", "epoch: 42, batch: 3100 // loss: 0.053\n", "epoch: 42, batch: 3200 // loss: 0.048\n", "epoch: 42, batch: 3300 // loss: 0.047\n", "epoch: 42, batch: 3400 // loss: 0.052\n", "epoch: 42, batch: 3500 // loss: 0.044\n", "epoch: 42, batch: 3600 // loss: 0.050\n", "epoch: 42, batch: 3700 // loss: 0.055\n", "\n", "epoch: 43, batch: 0 // loss: 0.063\n", "epoch: 43, batch: 100 // loss: 0.059\n", "epoch: 43, batch: 200 // loss: 0.050\n", "epoch: 43, batch: 300 // loss: 0.058\n", "epoch: 43, batch: 400 // loss: 0.056\n", "epoch: 43, batch: 500 // loss: 0.046\n", "epoch: 43, batch: 600 // loss: 0.047\n", "epoch: 43, batch: 700 // loss: 0.050\n", "epoch: 43, batch: 800 // loss: 0.053\n", "epoch: 43, batch: 900 // loss: 0.059\n", "epoch: 43, batch: 1000 // loss: 0.051\n", "epoch: 43, batch: 1100 // loss: 0.050\n", "epoch: 43, batch: 1200 // loss: 0.054\n", "epoch: 43, batch: 1300 // loss: 0.058\n", "epoch: 43, batch: 1400 // loss: 0.050\n", "epoch: 43, batch: 1500 // loss: 0.057\n", "epoch: 43, batch: 1600 // loss: 0.059\n", "epoch: 43, batch: 1700 // loss: 0.053\n", "epoch: 43, batch: 1800 // loss: 0.060\n", "epoch: 43, batch: 1900 // loss: 0.055\n", "epoch: 43, batch: 2000 // loss: 0.056\n", "epoch: 43, batch: 2100 // loss: 0.057\n", "epoch: 43, batch: 2200 // loss: 0.060\n", "epoch: 43, batch: 2300 // loss: 0.058\n", "epoch: 43, batch: 2400 // loss: 0.049\n", "epoch: 43, batch: 2500 // loss: 0.051\n", "epoch: 43, batch: 2600 // loss: 0.052\n", "epoch: 43, batch: 2700 // loss: 0.050\n", "epoch: 43, batch: 2800 // loss: 0.058\n", "epoch: 43, batch: 2900 // loss: 0.050\n", "epoch: 43, batch: 3000 // loss: 0.051\n", "epoch: 43, batch: 3100 // loss: 0.052\n", "epoch: 43, batch: 3200 // loss: 0.047\n", "epoch: 43, batch: 3300 // loss: 0.046\n", "epoch: 43, batch: 3400 // loss: 0.052\n", "epoch: 43, batch: 3500 // loss: 0.044\n", "epoch: 43, batch: 3600 // loss: 0.049\n", "epoch: 43, batch: 3700 // loss: 0.054\n", "\n", "epoch: 44, batch: 0 // loss: 0.063\n", "epoch: 44, batch: 100 // loss: 0.058\n", "epoch: 44, batch: 200 // loss: 0.050\n", "epoch: 44, batch: 300 // loss: 0.057\n", "epoch: 44, batch: 400 // loss: 0.055\n", "epoch: 44, batch: 500 // loss: 0.046\n", "epoch: 44, batch: 600 // loss: 0.047\n", "epoch: 44, batch: 700 // loss: 0.050\n", "epoch: 44, batch: 800 // loss: 0.052\n", "epoch: 44, batch: 900 // loss: 0.058\n", "epoch: 44, batch: 1000 // loss: 0.051\n", "epoch: 44, batch: 1100 // loss: 0.050\n", "epoch: 44, batch: 1200 // loss: 0.053\n", "epoch: 44, batch: 1300 // loss: 0.057\n", "epoch: 44, batch: 1400 // loss: 0.050\n", "epoch: 44, batch: 1500 // loss: 0.056\n", "epoch: 44, batch: 1600 // loss: 0.058\n", "epoch: 44, batch: 1700 // loss: 0.052\n", "epoch: 44, batch: 1800 // loss: 0.060\n", "epoch: 44, batch: 1900 // loss: 0.055\n", "epoch: 44, batch: 2000 // loss: 0.056\n", "epoch: 44, batch: 2100 // loss: 0.056\n", "epoch: 44, batch: 2200 // loss: 0.060\n", "epoch: 44, batch: 2300 // loss: 0.057\n", "epoch: 44, batch: 2400 // loss: 0.048\n", "epoch: 44, batch: 2500 // loss: 0.050\n", "epoch: 44, batch: 2600 // loss: 0.052\n", "epoch: 44, batch: 2700 // loss: 0.050\n", "epoch: 44, batch: 2800 // loss: 0.057\n", "epoch: 44, batch: 2900 // loss: 0.049\n", "epoch: 44, batch: 3000 // loss: 0.051\n", "epoch: 44, batch: 3100 // loss: 0.051\n", "epoch: 44, batch: 3200 // loss: 0.046\n", "epoch: 44, batch: 3300 // loss: 0.046\n", "epoch: 44, batch: 3400 // loss: 0.051\n", "epoch: 44, batch: 3500 // loss: 0.043\n", "epoch: 44, batch: 3600 // loss: 0.049\n", "epoch: 44, batch: 3700 // loss: 0.053\n", "\n", "epoch: 45, batch: 0 // loss: 0.062\n", "epoch: 45, batch: 100 // loss: 0.057\n", "epoch: 45, batch: 200 // loss: 0.049\n", "epoch: 45, batch: 300 // loss: 0.056\n", "epoch: 45, batch: 400 // loss: 0.055\n", "epoch: 45, batch: 500 // loss: 0.045\n", "epoch: 45, batch: 600 // loss: 0.046\n", "epoch: 45, batch: 700 // loss: 0.049\n", "epoch: 45, batch: 800 // loss: 0.051\n", "epoch: 45, batch: 900 // loss: 0.057\n", "epoch: 45, batch: 1000 // loss: 0.050\n", "epoch: 45, batch: 1100 // loss: 0.049\n", "epoch: 45, batch: 1200 // loss: 0.052\n", "epoch: 45, batch: 1300 // loss: 0.056\n", "epoch: 45, batch: 1400 // loss: 0.049\n", "epoch: 45, batch: 1500 // loss: 0.056\n", "epoch: 45, batch: 1600 // loss: 0.057\n", "epoch: 45, batch: 1700 // loss: 0.052\n", "epoch: 45, batch: 1800 // loss: 0.059\n", "epoch: 45, batch: 1900 // loss: 0.054\n", "epoch: 45, batch: 2000 // loss: 0.055\n", "epoch: 45, batch: 2100 // loss: 0.056\n", "epoch: 45, batch: 2200 // loss: 0.059\n", "epoch: 45, batch: 2300 // loss: 0.057\n", "epoch: 45, batch: 2400 // loss: 0.048\n", "epoch: 45, batch: 2500 // loss: 0.050\n", "epoch: 45, batch: 2600 // loss: 0.051\n", "epoch: 45, batch: 2700 // loss: 0.049\n", "epoch: 45, batch: 2800 // loss: 0.056\n", "epoch: 45, batch: 2900 // loss: 0.049\n", "epoch: 45, batch: 3000 // loss: 0.050\n", "epoch: 45, batch: 3100 // loss: 0.051\n", "epoch: 45, batch: 3200 // loss: 0.046\n", "epoch: 45, batch: 3300 // loss: 0.045\n", "epoch: 45, batch: 3400 // loss: 0.051\n", "epoch: 45, batch: 3500 // loss: 0.042\n", "epoch: 45, batch: 3600 // loss: 0.048\n", "epoch: 45, batch: 3700 // loss: 0.052\n", "\n", "epoch: 46, batch: 0 // loss: 0.061\n", "epoch: 46, batch: 100 // loss: 0.056\n", "epoch: 46, batch: 200 // loss: 0.049\n", "epoch: 46, batch: 300 // loss: 0.055\n", "epoch: 46, batch: 400 // loss: 0.054\n", "epoch: 46, batch: 500 // loss: 0.045\n", "epoch: 46, batch: 600 // loss: 0.046\n", "epoch: 46, batch: 700 // loss: 0.049\n", "epoch: 46, batch: 800 // loss: 0.050\n", "epoch: 46, batch: 900 // loss: 0.057\n", "epoch: 46, batch: 1000 // loss: 0.050\n", "epoch: 46, batch: 1100 // loss: 0.049\n", "epoch: 46, batch: 1200 // loss: 0.052\n", "epoch: 46, batch: 1300 // loss: 0.055\n", "epoch: 46, batch: 1400 // loss: 0.048\n", "epoch: 46, batch: 1500 // loss: 0.055\n", "epoch: 46, batch: 1600 // loss: 0.057\n", "epoch: 46, batch: 1700 // loss: 0.051\n", "epoch: 46, batch: 1800 // loss: 0.059\n", "epoch: 46, batch: 1900 // loss: 0.053\n", "epoch: 46, batch: 2000 // loss: 0.054\n", "epoch: 46, batch: 2100 // loss: 0.055\n", "epoch: 46, batch: 2200 // loss: 0.058\n", "epoch: 46, batch: 2300 // loss: 0.056\n", "epoch: 46, batch: 2400 // loss: 0.047\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 46, batch: 2500 // loss: 0.049\n", "epoch: 46, batch: 2600 // loss: 0.051\n", "epoch: 46, batch: 2700 // loss: 0.048\n", "epoch: 46, batch: 2800 // loss: 0.055\n", "epoch: 46, batch: 2900 // loss: 0.048\n", "epoch: 46, batch: 3000 // loss: 0.050\n", "epoch: 46, batch: 3100 // loss: 0.050\n", "epoch: 46, batch: 3200 // loss: 0.045\n", "epoch: 46, batch: 3300 // loss: 0.044\n", "epoch: 46, batch: 3400 // loss: 0.050\n", "epoch: 46, batch: 3500 // loss: 0.042\n", "epoch: 46, batch: 3600 // loss: 0.048\n", "epoch: 46, batch: 3700 // loss: 0.051\n", "\n", "epoch: 47, batch: 0 // loss: 0.060\n", "epoch: 47, batch: 100 // loss: 0.055\n", "epoch: 47, batch: 200 // loss: 0.048\n", "epoch: 47, batch: 300 // loss: 0.055\n", "epoch: 47, batch: 400 // loss: 0.053\n", "epoch: 47, batch: 500 // loss: 0.044\n", "epoch: 47, batch: 600 // loss: 0.045\n", "epoch: 47, batch: 700 // loss: 0.048\n", "epoch: 47, batch: 800 // loss: 0.050\n", "epoch: 47, batch: 900 // loss: 0.056\n", "epoch: 47, batch: 1000 // loss: 0.050\n", "epoch: 47, batch: 1100 // loss: 0.048\n", "epoch: 47, batch: 1200 // loss: 0.051\n", "epoch: 47, batch: 1300 // loss: 0.054\n", "epoch: 47, batch: 1400 // loss: 0.048\n", "epoch: 47, batch: 1500 // loss: 0.054\n", "epoch: 47, batch: 1600 // loss: 0.056\n", "epoch: 47, batch: 1700 // loss: 0.050\n", "epoch: 47, batch: 1800 // loss: 0.058\n", "epoch: 47, batch: 1900 // loss: 0.052\n", "epoch: 47, batch: 2000 // loss: 0.053\n", "epoch: 47, batch: 2100 // loss: 0.054\n", "epoch: 47, batch: 2200 // loss: 0.057\n", "epoch: 47, batch: 2300 // loss: 0.055\n", "epoch: 47, batch: 2400 // loss: 0.047\n", "epoch: 47, batch: 2500 // loss: 0.049\n", "epoch: 47, batch: 2600 // loss: 0.050\n", "epoch: 47, batch: 2700 // loss: 0.048\n", "epoch: 47, batch: 2800 // loss: 0.054\n", "epoch: 47, batch: 2900 // loss: 0.047\n", "epoch: 47, batch: 3000 // loss: 0.049\n", "epoch: 47, batch: 3100 // loss: 0.049\n", "epoch: 47, batch: 3200 // loss: 0.044\n", "epoch: 47, batch: 3300 // loss: 0.044\n", "epoch: 47, batch: 3400 // loss: 0.049\n", "epoch: 47, batch: 3500 // loss: 0.041\n", "epoch: 47, batch: 3600 // loss: 0.047\n", "epoch: 47, batch: 3700 // loss: 0.050\n", "\n", "epoch: 48, batch: 0 // loss: 0.060\n", "epoch: 48, batch: 100 // loss: 0.055\n", "epoch: 48, batch: 200 // loss: 0.047\n", "epoch: 48, batch: 300 // loss: 0.054\n", "epoch: 48, batch: 400 // loss: 0.052\n", "epoch: 48, batch: 500 // loss: 0.044\n", "epoch: 48, batch: 600 // loss: 0.045\n", "epoch: 48, batch: 700 // loss: 0.048\n", "epoch: 48, batch: 800 // loss: 0.049\n", "epoch: 48, batch: 900 // loss: 0.055\n", "epoch: 48, batch: 1000 // loss: 0.049\n", "epoch: 48, batch: 1100 // loss: 0.048\n", "epoch: 48, batch: 1200 // loss: 0.050\n", "epoch: 48, batch: 1300 // loss: 0.053\n", "epoch: 48, batch: 1400 // loss: 0.047\n", "epoch: 48, batch: 1500 // loss: 0.054\n", "epoch: 48, batch: 1600 // loss: 0.056\n", "epoch: 48, batch: 1700 // loss: 0.050\n", "epoch: 48, batch: 1800 // loss: 0.057\n", "epoch: 48, batch: 1900 // loss: 0.052\n", "epoch: 48, batch: 2000 // loss: 0.052\n", "epoch: 48, batch: 2100 // loss: 0.053\n", "epoch: 48, batch: 2200 // loss: 0.056\n", "epoch: 48, batch: 2300 // loss: 0.055\n", "epoch: 48, batch: 2400 // loss: 0.046\n", "epoch: 48, batch: 2500 // loss: 0.048\n", "epoch: 48, batch: 2600 // loss: 0.049\n", "epoch: 48, batch: 2700 // loss: 0.047\n", "epoch: 48, batch: 2800 // loss: 0.053\n", "epoch: 48, batch: 2900 // loss: 0.047\n", "epoch: 48, batch: 3000 // loss: 0.049\n", "epoch: 48, batch: 3100 // loss: 0.049\n", "epoch: 48, batch: 3200 // loss: 0.044\n", "epoch: 48, batch: 3300 // loss: 0.043\n", "epoch: 48, batch: 3400 // loss: 0.049\n", "epoch: 48, batch: 3500 // loss: 0.040\n", "epoch: 48, batch: 3600 // loss: 0.047\n", "epoch: 48, batch: 3700 // loss: 0.050\n", "\n", "epoch: 49, batch: 0 // loss: 0.059\n", "epoch: 49, batch: 100 // loss: 0.054\n", "epoch: 49, batch: 200 // loss: 0.047\n", "epoch: 49, batch: 300 // loss: 0.054\n", "epoch: 49, batch: 400 // loss: 0.052\n", "epoch: 49, batch: 500 // loss: 0.043\n", "epoch: 49, batch: 600 // loss: 0.044\n", "epoch: 49, batch: 700 // loss: 0.048\n", "epoch: 49, batch: 800 // loss: 0.048\n", "epoch: 49, batch: 900 // loss: 0.054\n", "epoch: 49, batch: 1000 // loss: 0.049\n", "epoch: 49, batch: 1100 // loss: 0.047\n", "epoch: 49, batch: 1200 // loss: 0.049\n", "epoch: 49, batch: 1300 // loss: 0.052\n", "epoch: 49, batch: 1400 // loss: 0.047\n", "epoch: 49, batch: 1500 // loss: 0.053\n", "epoch: 49, batch: 1600 // loss: 0.055\n", "epoch: 49, batch: 1700 // loss: 0.049\n", "epoch: 49, batch: 1800 // loss: 0.057\n", "epoch: 49, batch: 1900 // loss: 0.051\n", "epoch: 49, batch: 2000 // loss: 0.052\n", "epoch: 49, batch: 2100 // loss: 0.053\n", "epoch: 49, batch: 2200 // loss: 0.056\n", "epoch: 49, batch: 2300 // loss: 0.054\n", "epoch: 49, batch: 2400 // loss: 0.046\n", "epoch: 49, batch: 2500 // loss: 0.047\n", "epoch: 49, batch: 2600 // loss: 0.049\n", "epoch: 49, batch: 2700 // loss: 0.047\n", "epoch: 49, batch: 2800 // loss: 0.052\n", "epoch: 49, batch: 2900 // loss: 0.046\n", "epoch: 49, batch: 3000 // loss: 0.049\n", "epoch: 49, batch: 3100 // loss: 0.048\n", "epoch: 49, batch: 3200 // loss: 0.043\n", "epoch: 49, batch: 3300 // loss: 0.043\n", "epoch: 49, batch: 3400 // loss: 0.048\n", "epoch: 49, batch: 3500 // loss: 0.040\n", "epoch: 49, batch: 3600 // loss: 0.047\n", "epoch: 49, batch: 3700 // loss: 0.049\n", "\n", "epoch: 50, batch: 0 // loss: 0.058\n", "epoch: 50, batch: 100 // loss: 0.053\n", "epoch: 50, batch: 200 // loss: 0.046\n", "epoch: 50, batch: 300 // loss: 0.053\n", "epoch: 50, batch: 400 // loss: 0.051\n", "epoch: 50, batch: 500 // loss: 0.043\n", "epoch: 50, batch: 600 // loss: 0.044\n", "epoch: 50, batch: 700 // loss: 0.047\n", "epoch: 50, batch: 800 // loss: 0.047\n", "epoch: 50, batch: 900 // loss: 0.054\n", "epoch: 50, batch: 1000 // loss: 0.048\n", "epoch: 50, batch: 1100 // loss: 0.047\n", "epoch: 50, batch: 1200 // loss: 0.049\n", "epoch: 50, batch: 1300 // loss: 0.051\n", "epoch: 50, batch: 1400 // loss: 0.046\n", "epoch: 50, batch: 1500 // loss: 0.052\n", "epoch: 50, batch: 1600 // loss: 0.055\n", "epoch: 50, batch: 1700 // loss: 0.049\n", "epoch: 50, batch: 1800 // loss: 0.056\n", "epoch: 50, batch: 1900 // loss: 0.050\n", "epoch: 50, batch: 2000 // loss: 0.051\n", "epoch: 50, batch: 2100 // loss: 0.052\n", "epoch: 50, batch: 2200 // loss: 0.055\n", "epoch: 50, batch: 2300 // loss: 0.053\n", "epoch: 50, batch: 2400 // loss: 0.045\n", "epoch: 50, batch: 2500 // loss: 0.047\n", "epoch: 50, batch: 2600 // loss: 0.048\n", "epoch: 50, batch: 2700 // loss: 0.046\n", "epoch: 50, batch: 2800 // loss: 0.051\n", "epoch: 50, batch: 2900 // loss: 0.046\n", "epoch: 50, batch: 3000 // loss: 0.048\n", "epoch: 50, batch: 3100 // loss: 0.047\n", "epoch: 50, batch: 3200 // loss: 0.043\n", "epoch: 50, batch: 3300 // loss: 0.042\n", "epoch: 50, batch: 3400 // loss: 0.048\n", "epoch: 50, batch: 3500 // loss: 0.039\n", "epoch: 50, batch: 3600 // loss: 0.046\n", "epoch: 50, batch: 3700 // loss: 0.048\n", "\n", "epoch: 51, batch: 0 // loss: 0.058\n", "epoch: 51, batch: 100 // loss: 0.052\n", "epoch: 51, batch: 200 // loss: 0.046\n", "epoch: 51, batch: 300 // loss: 0.052\n", "epoch: 51, batch: 400 // loss: 0.051\n", "epoch: 51, batch: 500 // loss: 0.042\n", "epoch: 51, batch: 600 // loss: 0.043\n", "epoch: 51, batch: 700 // loss: 0.047\n", "epoch: 51, batch: 800 // loss: 0.047\n", "epoch: 51, batch: 900 // loss: 0.053\n", "epoch: 51, batch: 1000 // loss: 0.048\n", "epoch: 51, batch: 1100 // loss: 0.046\n", "epoch: 51, batch: 1200 // loss: 0.048\n", "epoch: 51, batch: 1300 // loss: 0.051\n", "epoch: 51, batch: 1400 // loss: 0.046\n", "epoch: 51, batch: 1500 // loss: 0.052\n", "epoch: 51, batch: 1600 // loss: 0.054\n", "epoch: 51, batch: 1700 // loss: 0.049\n", "epoch: 51, batch: 1800 // loss: 0.056\n", "epoch: 51, batch: 1900 // loss: 0.050\n", "epoch: 51, batch: 2000 // loss: 0.051\n", "epoch: 51, batch: 2100 // loss: 0.051\n", "epoch: 51, batch: 2200 // loss: 0.054\n", "epoch: 51, batch: 2300 // loss: 0.053\n", "epoch: 51, batch: 2400 // loss: 0.045\n", "epoch: 51, batch: 2500 // loss: 0.046\n", "epoch: 51, batch: 2600 // loss: 0.048\n", "epoch: 51, batch: 2700 // loss: 0.046\n", "epoch: 51, batch: 2800 // loss: 0.051\n", "epoch: 51, batch: 2900 // loss: 0.045\n", "epoch: 51, batch: 3000 // loss: 0.048\n", "epoch: 51, batch: 3100 // loss: 0.047\n", "epoch: 51, batch: 3200 // loss: 0.042\n", "epoch: 51, batch: 3300 // loss: 0.042\n", "epoch: 51, batch: 3400 // loss: 0.047\n", "epoch: 51, batch: 3500 // loss: 0.039\n", "epoch: 51, batch: 3600 // loss: 0.046\n", "epoch: 51, batch: 3700 // loss: 0.048\n", "\n", "epoch: 52, batch: 0 // loss: 0.057\n", "epoch: 52, batch: 100 // loss: 0.051\n", "epoch: 52, batch: 200 // loss: 0.046\n", "epoch: 52, batch: 300 // loss: 0.052\n", "epoch: 52, batch: 400 // loss: 0.050\n", "epoch: 52, batch: 500 // loss: 0.042\n", "epoch: 52, batch: 600 // loss: 0.043\n", "epoch: 52, batch: 700 // loss: 0.047\n", "epoch: 52, batch: 800 // loss: 0.046\n", "epoch: 52, batch: 900 // loss: 0.052\n", "epoch: 52, batch: 1000 // loss: 0.048\n", "epoch: 52, batch: 1100 // loss: 0.046\n", "epoch: 52, batch: 1200 // loss: 0.048\n", "epoch: 52, batch: 1300 // loss: 0.050\n", "epoch: 52, batch: 1400 // loss: 0.045\n", "epoch: 52, batch: 1500 // loss: 0.051\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 52, batch: 1600 // loss: 0.054\n", "epoch: 52, batch: 1700 // loss: 0.048\n", "epoch: 52, batch: 1800 // loss: 0.055\n", "epoch: 52, batch: 1900 // loss: 0.049\n", "epoch: 52, batch: 2000 // loss: 0.050\n", "epoch: 52, batch: 2100 // loss: 0.051\n", "epoch: 52, batch: 2200 // loss: 0.054\n", "epoch: 52, batch: 2300 // loss: 0.052\n", "epoch: 52, batch: 2400 // loss: 0.044\n", "epoch: 52, batch: 2500 // loss: 0.046\n", "epoch: 52, batch: 2600 // loss: 0.048\n", "epoch: 52, batch: 2700 // loss: 0.045\n", "epoch: 52, batch: 2800 // loss: 0.050\n", "epoch: 52, batch: 2900 // loss: 0.045\n", "epoch: 52, batch: 3000 // loss: 0.048\n", "epoch: 52, batch: 3100 // loss: 0.046\n", "epoch: 52, batch: 3200 // loss: 0.042\n", "epoch: 52, batch: 3300 // loss: 0.041\n", "epoch: 52, batch: 3400 // loss: 0.047\n", "epoch: 52, batch: 3500 // loss: 0.038\n", "epoch: 52, batch: 3600 // loss: 0.046\n", "epoch: 52, batch: 3700 // loss: 0.047\n", "\n", "epoch: 53, batch: 0 // loss: 0.057\n", "epoch: 53, batch: 100 // loss: 0.051\n", "epoch: 53, batch: 200 // loss: 0.045\n", "epoch: 53, batch: 300 // loss: 0.051\n", "epoch: 53, batch: 400 // loss: 0.050\n", "epoch: 53, batch: 500 // loss: 0.042\n", "epoch: 53, batch: 600 // loss: 0.043\n", "epoch: 53, batch: 700 // loss: 0.046\n", "epoch: 53, batch: 800 // loss: 0.046\n", "epoch: 53, batch: 900 // loss: 0.052\n", "epoch: 53, batch: 1000 // loss: 0.047\n", "epoch: 53, batch: 1100 // loss: 0.045\n", "epoch: 53, batch: 1200 // loss: 0.047\n", "epoch: 53, batch: 1300 // loss: 0.049\n", "epoch: 53, batch: 1400 // loss: 0.045\n", "epoch: 53, batch: 1500 // loss: 0.051\n", "epoch: 53, batch: 1600 // loss: 0.054\n", "epoch: 53, batch: 1700 // loss: 0.048\n", "epoch: 53, batch: 1800 // loss: 0.055\n", "epoch: 53, batch: 1900 // loss: 0.049\n", "epoch: 53, batch: 2000 // loss: 0.050\n", "epoch: 53, batch: 2100 // loss: 0.050\n", "epoch: 53, batch: 2200 // loss: 0.053\n", "epoch: 53, batch: 2300 // loss: 0.052\n", "epoch: 53, batch: 2400 // loss: 0.044\n", "epoch: 53, batch: 2500 // loss: 0.045\n", "epoch: 53, batch: 2600 // loss: 0.047\n", "epoch: 53, batch: 2700 // loss: 0.045\n", "epoch: 53, batch: 2800 // loss: 0.050\n", "epoch: 53, batch: 2900 // loss: 0.044\n", "epoch: 53, batch: 3000 // loss: 0.047\n", "epoch: 53, batch: 3100 // loss: 0.046\n", "epoch: 53, batch: 3200 // loss: 0.041\n", "epoch: 53, batch: 3300 // loss: 0.041\n", "epoch: 53, batch: 3400 // loss: 0.046\n", "epoch: 53, batch: 3500 // loss: 0.038\n", "epoch: 53, batch: 3600 // loss: 0.045\n", "epoch: 53, batch: 3700 // loss: 0.047\n", "\n", "epoch: 54, batch: 0 // loss: 0.056\n", "epoch: 54, batch: 100 // loss: 0.050\n", "epoch: 54, batch: 200 // loss: 0.045\n", "epoch: 54, batch: 300 // loss: 0.051\n", "epoch: 54, batch: 400 // loss: 0.049\n", "epoch: 54, batch: 500 // loss: 0.041\n", "epoch: 54, batch: 600 // loss: 0.042\n", "epoch: 54, batch: 700 // loss: 0.046\n", "epoch: 54, batch: 800 // loss: 0.045\n", "epoch: 54, batch: 900 // loss: 0.052\n", "epoch: 54, batch: 1000 // loss: 0.047\n", "epoch: 54, batch: 1100 // loss: 0.045\n", "epoch: 54, batch: 1200 // loss: 0.047\n", "epoch: 54, batch: 1300 // loss: 0.049\n", "epoch: 54, batch: 1400 // loss: 0.045\n", "epoch: 54, batch: 1500 // loss: 0.051\n", "epoch: 54, batch: 1600 // loss: 0.053\n", "epoch: 54, batch: 1700 // loss: 0.047\n", "epoch: 54, batch: 1800 // loss: 0.055\n", "epoch: 54, batch: 1900 // loss: 0.048\n", "epoch: 54, batch: 2000 // loss: 0.049\n", "epoch: 54, batch: 2100 // loss: 0.050\n", "epoch: 54, batch: 2200 // loss: 0.053\n", "epoch: 54, batch: 2300 // loss: 0.051\n", "epoch: 54, batch: 2400 // loss: 0.044\n", "epoch: 54, batch: 2500 // loss: 0.045\n", "epoch: 54, batch: 2600 // loss: 0.047\n", "epoch: 54, batch: 2700 // loss: 0.044\n", "epoch: 54, batch: 2800 // loss: 0.049\n", "epoch: 54, batch: 2900 // loss: 0.044\n", "epoch: 54, batch: 3000 // loss: 0.047\n", "epoch: 54, batch: 3100 // loss: 0.045\n", "epoch: 54, batch: 3200 // loss: 0.041\n", "epoch: 54, batch: 3300 // loss: 0.040\n", "epoch: 54, batch: 3400 // loss: 0.046\n", "epoch: 54, batch: 3500 // loss: 0.037\n", "epoch: 54, batch: 3600 // loss: 0.045\n", "epoch: 54, batch: 3700 // loss: 0.046\n", "\n", "epoch: 55, batch: 0 // loss: 0.056\n", "epoch: 55, batch: 100 // loss: 0.050\n", "epoch: 55, batch: 200 // loss: 0.045\n", "epoch: 55, batch: 300 // loss: 0.051\n", "epoch: 55, batch: 400 // loss: 0.049\n", "epoch: 55, batch: 500 // loss: 0.041\n", "epoch: 55, batch: 600 // loss: 0.042\n", "epoch: 55, batch: 700 // loss: 0.046\n", "epoch: 55, batch: 800 // loss: 0.045\n", "epoch: 55, batch: 900 // loss: 0.051\n", "epoch: 55, batch: 1000 // loss: 0.047\n", "epoch: 55, batch: 1100 // loss: 0.045\n", "epoch: 55, batch: 1200 // loss: 0.046\n", "epoch: 55, batch: 1300 // loss: 0.048\n", "epoch: 55, batch: 1400 // loss: 0.044\n", "epoch: 55, batch: 1500 // loss: 0.050\n", "epoch: 55, batch: 1600 // loss: 0.053\n", "epoch: 55, batch: 1700 // loss: 0.047\n", "epoch: 55, batch: 1800 // loss: 0.054\n", "epoch: 55, batch: 1900 // loss: 0.048\n", "epoch: 55, batch: 2000 // loss: 0.049\n", "epoch: 55, batch: 2100 // loss: 0.049\n", "epoch: 55, batch: 2200 // loss: 0.052\n", "epoch: 55, batch: 2300 // loss: 0.051\n", "epoch: 55, batch: 2400 // loss: 0.044\n", "epoch: 55, batch: 2500 // loss: 0.045\n", "epoch: 55, batch: 2600 // loss: 0.047\n", "epoch: 55, batch: 2700 // loss: 0.044\n", "epoch: 55, batch: 2800 // loss: 0.049\n", "epoch: 55, batch: 2900 // loss: 0.044\n", "epoch: 55, batch: 3000 // loss: 0.047\n", "epoch: 55, batch: 3100 // loss: 0.045\n", "epoch: 55, batch: 3200 // loss: 0.041\n", "epoch: 55, batch: 3300 // loss: 0.040\n", "epoch: 55, batch: 3400 // loss: 0.046\n", "epoch: 55, batch: 3500 // loss: 0.037\n", "epoch: 55, batch: 3600 // loss: 0.045\n", "epoch: 55, batch: 3700 // loss: 0.046\n", "\n", "epoch: 56, batch: 0 // loss: 0.056\n", "epoch: 56, batch: 100 // loss: 0.049\n", "epoch: 56, batch: 200 // loss: 0.044\n", "epoch: 56, batch: 300 // loss: 0.050\n", "epoch: 56, batch: 400 // loss: 0.048\n", "epoch: 56, batch: 500 // loss: 0.041\n", "epoch: 56, batch: 600 // loss: 0.042\n", "epoch: 56, batch: 700 // loss: 0.046\n", "epoch: 56, batch: 800 // loss: 0.044\n", "epoch: 56, batch: 900 // loss: 0.051\n", "epoch: 56, batch: 1000 // loss: 0.047\n", "epoch: 56, batch: 1100 // loss: 0.044\n", "epoch: 56, batch: 1200 // loss: 0.046\n", "epoch: 56, batch: 1300 // loss: 0.048\n", "epoch: 56, batch: 1400 // loss: 0.044\n", "epoch: 56, batch: 1500 // loss: 0.050\n", "epoch: 56, batch: 1600 // loss: 0.053\n", "epoch: 56, batch: 1700 // loss: 0.047\n", "epoch: 56, batch: 1800 // loss: 0.054\n", "epoch: 56, batch: 1900 // loss: 0.047\n", "epoch: 56, batch: 2000 // loss: 0.048\n", "epoch: 56, batch: 2100 // loss: 0.049\n", "epoch: 56, batch: 2200 // loss: 0.052\n", "epoch: 56, batch: 2300 // loss: 0.051\n", "epoch: 56, batch: 2400 // loss: 0.043\n", "epoch: 56, batch: 2500 // loss: 0.044\n", "epoch: 56, batch: 2600 // loss: 0.046\n", "epoch: 56, batch: 2700 // loss: 0.044\n", "epoch: 56, batch: 2800 // loss: 0.048\n", "epoch: 56, batch: 2900 // loss: 0.044\n", "epoch: 56, batch: 3000 // loss: 0.047\n", "epoch: 56, batch: 3100 // loss: 0.045\n", "epoch: 56, batch: 3200 // loss: 0.041\n", "epoch: 56, batch: 3300 // loss: 0.040\n", "epoch: 56, batch: 3400 // loss: 0.046\n", "epoch: 56, batch: 3500 // loss: 0.037\n", "epoch: 56, batch: 3600 // loss: 0.045\n", "epoch: 56, batch: 3700 // loss: 0.045\n", "\n", "epoch: 57, batch: 0 // loss: 0.055\n", "epoch: 57, batch: 100 // loss: 0.049\n", "epoch: 57, batch: 200 // loss: 0.044\n", "epoch: 57, batch: 300 // loss: 0.050\n", "epoch: 57, batch: 400 // loss: 0.048\n", "epoch: 57, batch: 500 // loss: 0.041\n", "epoch: 57, batch: 600 // loss: 0.042\n", "epoch: 57, batch: 700 // loss: 0.045\n", "epoch: 57, batch: 800 // loss: 0.044\n", "epoch: 57, batch: 900 // loss: 0.051\n", "epoch: 57, batch: 1000 // loss: 0.046\n", "epoch: 57, batch: 1100 // loss: 0.044\n", "epoch: 57, batch: 1200 // loss: 0.046\n", "epoch: 57, batch: 1300 // loss: 0.047\n", "epoch: 57, batch: 1400 // loss: 0.044\n", "epoch: 57, batch: 1500 // loss: 0.050\n", "epoch: 57, batch: 1600 // loss: 0.053\n", "epoch: 57, batch: 1700 // loss: 0.047\n", "epoch: 57, batch: 1800 // loss: 0.054\n", "epoch: 57, batch: 1900 // loss: 0.047\n", "epoch: 57, batch: 2000 // loss: 0.048\n", "epoch: 57, batch: 2100 // loss: 0.049\n", "epoch: 57, batch: 2200 // loss: 0.051\n", "epoch: 57, batch: 2300 // loss: 0.051\n", "epoch: 57, batch: 2400 // loss: 0.043\n", "epoch: 57, batch: 2500 // loss: 0.044\n", "epoch: 57, batch: 2600 // loss: 0.046\n", "epoch: 57, batch: 2700 // loss: 0.044\n", "epoch: 57, batch: 2800 // loss: 0.048\n", "epoch: 57, batch: 2900 // loss: 0.043\n", "epoch: 57, batch: 3000 // loss: 0.047\n", "epoch: 57, batch: 3100 // loss: 0.045\n", "epoch: 57, batch: 3200 // loss: 0.040\n", "epoch: 57, batch: 3300 // loss: 0.040\n", "epoch: 57, batch: 3400 // loss: 0.045\n", "epoch: 57, batch: 3500 // loss: 0.036\n", "epoch: 57, batch: 3600 // loss: 0.044\n", "epoch: 57, batch: 3700 // loss: 0.045\n", "\n", "epoch: 58, batch: 0 // loss: 0.055\n", "epoch: 58, batch: 100 // loss: 0.048\n", "epoch: 58, batch: 200 // loss: 0.044\n", "epoch: 58, batch: 300 // loss: 0.050\n", "epoch: 58, batch: 400 // loss: 0.048\n", "epoch: 58, batch: 500 // loss: 0.041\n", "epoch: 58, batch: 600 // loss: 0.041\n", "epoch: 58, batch: 700 // loss: 0.045\n", "epoch: 58, batch: 800 // loss: 0.044\n", "epoch: 58, batch: 900 // loss: 0.050\n", "epoch: 58, batch: 1000 // loss: 0.046\n", "epoch: 58, batch: 1100 // loss: 0.044\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 58, batch: 1200 // loss: 0.045\n", "epoch: 58, batch: 1300 // loss: 0.047\n", "epoch: 58, batch: 1400 // loss: 0.044\n", "epoch: 58, batch: 1500 // loss: 0.049\n", "epoch: 58, batch: 1600 // loss: 0.053\n", "epoch: 58, batch: 1700 // loss: 0.046\n", "epoch: 58, batch: 1800 // loss: 0.054\n", "epoch: 58, batch: 1900 // loss: 0.047\n", "epoch: 58, batch: 2000 // loss: 0.048\n", "epoch: 58, batch: 2100 // loss: 0.048\n", "epoch: 58, batch: 2200 // loss: 0.051\n", "epoch: 58, batch: 2300 // loss: 0.050\n", "epoch: 58, batch: 2400 // loss: 0.043\n", "epoch: 58, batch: 2500 // loss: 0.044\n", "epoch: 58, batch: 2600 // loss: 0.046\n", "epoch: 58, batch: 2700 // loss: 0.044\n", "epoch: 58, batch: 2800 // loss: 0.048\n", "epoch: 58, batch: 2900 // loss: 0.043\n", "epoch: 58, batch: 3000 // loss: 0.046\n", "epoch: 58, batch: 3100 // loss: 0.044\n", "epoch: 58, batch: 3200 // loss: 0.040\n", "epoch: 58, batch: 3300 // loss: 0.039\n", "epoch: 58, batch: 3400 // loss: 0.045\n", "epoch: 58, batch: 3500 // loss: 0.036\n", "epoch: 58, batch: 3600 // loss: 0.044\n", "epoch: 58, batch: 3700 // loss: 0.045\n", "\n", "epoch: 59, batch: 0 // loss: 0.055\n", "epoch: 59, batch: 100 // loss: 0.048\n", "epoch: 59, batch: 200 // loss: 0.044\n", "epoch: 59, batch: 300 // loss: 0.050\n", "epoch: 59, batch: 400 // loss: 0.048\n", "epoch: 59, batch: 500 // loss: 0.040\n", "epoch: 59, batch: 600 // loss: 0.041\n", "epoch: 59, batch: 700 // loss: 0.045\n", "epoch: 59, batch: 800 // loss: 0.044\n", "epoch: 59, batch: 900 // loss: 0.050\n", "epoch: 59, batch: 1000 // loss: 0.046\n", "epoch: 59, batch: 1100 // loss: 0.044\n", "epoch: 59, batch: 1200 // loss: 0.045\n", "epoch: 59, batch: 1300 // loss: 0.047\n", "epoch: 59, batch: 1400 // loss: 0.043\n", "epoch: 59, batch: 1500 // loss: 0.049\n", "epoch: 59, batch: 1600 // loss: 0.052\n", "epoch: 59, batch: 1700 // loss: 0.046\n", "epoch: 59, batch: 1800 // loss: 0.054\n", "epoch: 59, batch: 1900 // loss: 0.047\n", "epoch: 59, batch: 2000 // loss: 0.048\n", "epoch: 59, batch: 2100 // loss: 0.048\n", "epoch: 59, batch: 2200 // loss: 0.051\n", "epoch: 59, batch: 2300 // loss: 0.050\n", "epoch: 59, batch: 2400 // loss: 0.043\n", "epoch: 59, batch: 2500 // loss: 0.044\n", "epoch: 59, batch: 2600 // loss: 0.046\n", "epoch: 59, batch: 2700 // loss: 0.043\n", "epoch: 59, batch: 2800 // loss: 0.047\n", "epoch: 59, batch: 2900 // loss: 0.043\n", "epoch: 59, batch: 3000 // loss: 0.046\n", "epoch: 59, batch: 3100 // loss: 0.044\n", "epoch: 59, batch: 3200 // loss: 0.040\n", "epoch: 59, batch: 3300 // loss: 0.039\n", "epoch: 59, batch: 3400 // loss: 0.045\n", "epoch: 59, batch: 3500 // loss: 0.036\n", "epoch: 59, batch: 3600 // loss: 0.044\n", "epoch: 59, batch: 3700 // loss: 0.045\n", "\n", "epoch: 60, batch: 0 // loss: 0.054\n", "epoch: 60, batch: 100 // loss: 0.048\n", "epoch: 60, batch: 200 // loss: 0.044\n", "epoch: 60, batch: 300 // loss: 0.050\n", "epoch: 60, batch: 400 // loss: 0.047\n", "epoch: 60, batch: 500 // loss: 0.040\n", "epoch: 60, batch: 600 // loss: 0.041\n", "epoch: 60, batch: 700 // loss: 0.045\n", "epoch: 60, batch: 800 // loss: 0.043\n", "epoch: 60, batch: 900 // loss: 0.050\n", "epoch: 60, batch: 1000 // loss: 0.046\n", "epoch: 60, batch: 1100 // loss: 0.044\n", "epoch: 60, batch: 1200 // loss: 0.045\n", "epoch: 60, batch: 1300 // loss: 0.047\n", "epoch: 60, batch: 1400 // loss: 0.043\n", "epoch: 60, batch: 1500 // loss: 0.049\n", "epoch: 60, batch: 1600 // loss: 0.052\n", "epoch: 60, batch: 1700 // loss: 0.046\n", "epoch: 60, batch: 1800 // loss: 0.053\n", "epoch: 60, batch: 1900 // loss: 0.046\n", "epoch: 60, batch: 2000 // loss: 0.048\n", "epoch: 60, batch: 2100 // loss: 0.048\n", "epoch: 60, batch: 2200 // loss: 0.051\n", "epoch: 60, batch: 2300 // loss: 0.050\n", "epoch: 60, batch: 2400 // loss: 0.043\n", "epoch: 60, batch: 2500 // loss: 0.044\n", "epoch: 60, batch: 2600 // loss: 0.046\n", "epoch: 60, batch: 2700 // loss: 0.043\n", "epoch: 60, batch: 2800 // loss: 0.047\n", "epoch: 60, batch: 2900 // loss: 0.043\n", "epoch: 60, batch: 3000 // loss: 0.046\n", "epoch: 60, batch: 3100 // loss: 0.044\n", "epoch: 60, batch: 3200 // loss: 0.040\n", "epoch: 60, batch: 3300 // loss: 0.039\n", "epoch: 60, batch: 3400 // loss: 0.045\n", "epoch: 60, batch: 3500 // loss: 0.036\n", "epoch: 60, batch: 3600 // loss: 0.044\n", "epoch: 60, batch: 3700 // loss: 0.044\n", "\n", "epoch: 61, batch: 0 // loss: 0.054\n", "epoch: 61, batch: 100 // loss: 0.048\n", "epoch: 61, batch: 200 // loss: 0.044\n", "epoch: 61, batch: 300 // loss: 0.050\n", "epoch: 61, batch: 400 // loss: 0.047\n", "epoch: 61, batch: 500 // loss: 0.040\n", "epoch: 61, batch: 600 // loss: 0.041\n", "epoch: 61, batch: 700 // loss: 0.045\n", "epoch: 61, batch: 800 // loss: 0.043\n", "epoch: 61, batch: 900 // loss: 0.050\n", "epoch: 61, batch: 1000 // loss: 0.046\n", "epoch: 61, batch: 1100 // loss: 0.043\n", "epoch: 61, batch: 1200 // loss: 0.045\n", "epoch: 61, batch: 1300 // loss: 0.046\n", "epoch: 61, batch: 1400 // loss: 0.043\n", "epoch: 61, batch: 1500 // loss: 0.049\n", "epoch: 61, batch: 1600 // loss: 0.052\n", "epoch: 61, batch: 1700 // loss: 0.046\n", "epoch: 61, batch: 1800 // loss: 0.053\n", "epoch: 61, batch: 1900 // loss: 0.046\n", "epoch: 61, batch: 2000 // loss: 0.047\n", "epoch: 61, batch: 2100 // loss: 0.048\n", "epoch: 61, batch: 2200 // loss: 0.051\n", "epoch: 61, batch: 2300 // loss: 0.050\n", "epoch: 61, batch: 2400 // loss: 0.043\n", "epoch: 61, batch: 2500 // loss: 0.043\n", "epoch: 61, batch: 2600 // loss: 0.046\n", "epoch: 61, batch: 2700 // loss: 0.043\n", "epoch: 61, batch: 2800 // loss: 0.047\n", "epoch: 61, batch: 2900 // loss: 0.043\n", "epoch: 61, batch: 3000 // loss: 0.046\n", "epoch: 61, batch: 3100 // loss: 0.044\n", "epoch: 61, batch: 3200 // loss: 0.040\n", "epoch: 61, batch: 3300 // loss: 0.039\n", "epoch: 61, batch: 3400 // loss: 0.045\n", "epoch: 61, batch: 3500 // loss: 0.036\n", "epoch: 61, batch: 3600 // loss: 0.044\n", "epoch: 61, batch: 3700 // loss: 0.044\n", "\n", "epoch: 62, batch: 0 // loss: 0.054\n", "epoch: 62, batch: 100 // loss: 0.047\n", "epoch: 62, batch: 200 // loss: 0.043\n", "epoch: 62, batch: 300 // loss: 0.049\n", "epoch: 62, batch: 400 // loss: 0.047\n", "epoch: 62, batch: 500 // loss: 0.040\n", "epoch: 62, batch: 600 // loss: 0.041\n", "epoch: 62, batch: 700 // loss: 0.045\n", "epoch: 62, batch: 800 // loss: 0.043\n", "epoch: 62, batch: 900 // loss: 0.050\n", "epoch: 62, batch: 1000 // loss: 0.046\n", "epoch: 62, batch: 1100 // loss: 0.043\n", "epoch: 62, batch: 1200 // loss: 0.045\n", "epoch: 62, batch: 1300 // loss: 0.046\n", "epoch: 62, batch: 1400 // loss: 0.043\n", "epoch: 62, batch: 1500 // loss: 0.049\n", "epoch: 62, batch: 1600 // loss: 0.052\n", "epoch: 62, batch: 1700 // loss: 0.046\n", "epoch: 62, batch: 1800 // loss: 0.053\n", "epoch: 62, batch: 1900 // loss: 0.046\n", "epoch: 62, batch: 2000 // loss: 0.047\n", "epoch: 62, batch: 2100 // loss: 0.047\n", "epoch: 62, batch: 2200 // loss: 0.050\n", "epoch: 62, batch: 2300 // loss: 0.050\n", "epoch: 62, batch: 2400 // loss: 0.043\n", "epoch: 62, batch: 2500 // loss: 0.043\n", "epoch: 62, batch: 2600 // loss: 0.045\n", "epoch: 62, batch: 2700 // loss: 0.043\n", "epoch: 62, batch: 2800 // loss: 0.047\n", "epoch: 62, batch: 2900 // loss: 0.043\n", "epoch: 62, batch: 3000 // loss: 0.046\n", "epoch: 62, batch: 3100 // loss: 0.044\n", "epoch: 62, batch: 3200 // loss: 0.040\n", "epoch: 62, batch: 3300 // loss: 0.039\n", "epoch: 62, batch: 3400 // loss: 0.045\n", "epoch: 62, batch: 3500 // loss: 0.035\n", "epoch: 62, batch: 3600 // loss: 0.044\n", "epoch: 62, batch: 3700 // loss: 0.044\n", "\n", "epoch: 63, batch: 0 // loss: 0.054\n", "epoch: 63, batch: 100 // loss: 0.047\n", "epoch: 63, batch: 200 // loss: 0.043\n", "epoch: 63, batch: 300 // loss: 0.049\n", "epoch: 63, batch: 400 // loss: 0.047\n", "epoch: 63, batch: 500 // loss: 0.040\n", "epoch: 63, batch: 600 // loss: 0.041\n", "epoch: 63, batch: 700 // loss: 0.045\n", "epoch: 63, batch: 800 // loss: 0.043\n", "epoch: 63, batch: 900 // loss: 0.050\n", "epoch: 63, batch: 1000 // loss: 0.046\n", "epoch: 63, batch: 1100 // loss: 0.043\n", "epoch: 63, batch: 1200 // loss: 0.045\n", "epoch: 63, batch: 1300 // loss: 0.046\n", "epoch: 63, batch: 1400 // loss: 0.043\n", "epoch: 63, batch: 1500 // loss: 0.049\n", "epoch: 63, batch: 1600 // loss: 0.052\n", "epoch: 63, batch: 1700 // loss: 0.046\n", "epoch: 63, batch: 1800 // loss: 0.053\n", "epoch: 63, batch: 1900 // loss: 0.046\n", "epoch: 63, batch: 2000 // loss: 0.047\n", "epoch: 63, batch: 2100 // loss: 0.047\n", "epoch: 63, batch: 2200 // loss: 0.050\n", "epoch: 63, batch: 2300 // loss: 0.049\n", "epoch: 63, batch: 2400 // loss: 0.043\n", "epoch: 63, batch: 2500 // loss: 0.043\n", "epoch: 63, batch: 2600 // loss: 0.045\n", "epoch: 63, batch: 2700 // loss: 0.043\n", "epoch: 63, batch: 2800 // loss: 0.047\n", "epoch: 63, batch: 2900 // loss: 0.043\n", "epoch: 63, batch: 3000 // loss: 0.046\n", "epoch: 63, batch: 3100 // loss: 0.044\n", "epoch: 63, batch: 3200 // loss: 0.040\n", "epoch: 63, batch: 3300 // loss: 0.039\n", "epoch: 63, batch: 3400 // loss: 0.045\n", "epoch: 63, batch: 3500 // loss: 0.035\n", "epoch: 63, batch: 3600 // loss: 0.044\n", "epoch: 63, batch: 3700 // loss: 0.044\n", "\n", "epoch: 64, batch: 0 // loss: 0.054\n", "epoch: 64, batch: 100 // loss: 0.047\n", "epoch: 64, batch: 200 // loss: 0.043\n", "epoch: 64, batch: 300 // loss: 0.049\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 64, batch: 400 // loss: 0.047\n", "epoch: 64, batch: 500 // loss: 0.040\n", "epoch: 64, batch: 600 // loss: 0.041\n", "epoch: 64, batch: 700 // loss: 0.045\n", "epoch: 64, batch: 800 // loss: 0.043\n", "epoch: 64, batch: 900 // loss: 0.049\n", "epoch: 64, batch: 1000 // loss: 0.046\n", "epoch: 64, batch: 1100 // loss: 0.043\n", "epoch: 64, batch: 1200 // loss: 0.045\n", "epoch: 64, batch: 1300 // loss: 0.046\n", "epoch: 64, batch: 1400 // loss: 0.043\n", "epoch: 64, batch: 1500 // loss: 0.049\n", "epoch: 64, batch: 1600 // loss: 0.052\n", "epoch: 64, batch: 1700 // loss: 0.046\n", "epoch: 64, batch: 1800 // loss: 0.053\n", "epoch: 64, batch: 1900 // loss: 0.046\n", "epoch: 64, batch: 2000 // loss: 0.047\n", "epoch: 64, batch: 2100 // loss: 0.047\n", "epoch: 64, batch: 2200 // loss: 0.050\n", "epoch: 64, batch: 2300 // loss: 0.049\n", "epoch: 64, batch: 2400 // loss: 0.043\n", "epoch: 64, batch: 2500 // loss: 0.043\n", "epoch: 64, batch: 2600 // loss: 0.045\n", "epoch: 64, batch: 2700 // loss: 0.043\n", "epoch: 64, batch: 2800 // loss: 0.047\n", "epoch: 64, batch: 2900 // loss: 0.042\n", "epoch: 64, batch: 3000 // loss: 0.046\n", "epoch: 64, batch: 3100 // loss: 0.044\n", "epoch: 64, batch: 3200 // loss: 0.040\n", "epoch: 64, batch: 3300 // loss: 0.039\n", "epoch: 64, batch: 3400 // loss: 0.045\n", "epoch: 64, batch: 3500 // loss: 0.035\n", "epoch: 64, batch: 3600 // loss: 0.044\n", "epoch: 64, batch: 3700 // loss: 0.044\n", "\n", "epoch: 65, batch: 0 // loss: 0.054\n", "epoch: 65, batch: 100 // loss: 0.047\n", "epoch: 65, batch: 200 // loss: 0.043\n", "epoch: 65, batch: 300 // loss: 0.049\n", "epoch: 65, batch: 400 // loss: 0.047\n", "epoch: 65, batch: 500 // loss: 0.040\n", "epoch: 65, batch: 600 // loss: 0.041\n", "epoch: 65, batch: 700 // loss: 0.045\n", "epoch: 65, batch: 800 // loss: 0.043\n", "epoch: 65, batch: 900 // loss: 0.049\n", "epoch: 65, batch: 1000 // loss: 0.046\n", "epoch: 65, batch: 1100 // loss: 0.043\n", "epoch: 65, batch: 1200 // loss: 0.044\n", "epoch: 65, batch: 1300 // loss: 0.046\n", "epoch: 65, batch: 1400 // loss: 0.043\n", "epoch: 65, batch: 1500 // loss: 0.049\n", "epoch: 65, batch: 1600 // loss: 0.052\n", "epoch: 65, batch: 1700 // loss: 0.046\n", "epoch: 65, batch: 1800 // loss: 0.053\n", "epoch: 65, batch: 1900 // loss: 0.046\n", "epoch: 65, batch: 2000 // loss: 0.047\n", "epoch: 65, batch: 2100 // loss: 0.047\n", "epoch: 65, batch: 2200 // loss: 0.050\n", "epoch: 65, batch: 2300 // loss: 0.049\n", "epoch: 65, batch: 2400 // loss: 0.042\n", "epoch: 65, batch: 2500 // loss: 0.043\n", "epoch: 65, batch: 2600 // loss: 0.045\n", "epoch: 65, batch: 2700 // loss: 0.043\n", "epoch: 65, batch: 2800 // loss: 0.047\n", "epoch: 65, batch: 2900 // loss: 0.042\n", "epoch: 65, batch: 3000 // loss: 0.046\n", "epoch: 65, batch: 3100 // loss: 0.043\n", "epoch: 65, batch: 3200 // loss: 0.039\n", "epoch: 65, batch: 3300 // loss: 0.039\n", "epoch: 65, batch: 3400 // loss: 0.045\n", "epoch: 65, batch: 3500 // loss: 0.035\n", "epoch: 65, batch: 3600 // loss: 0.044\n", "epoch: 65, batch: 3700 // loss: 0.044\n", "\n", "epoch: 66, batch: 0 // loss: 0.054\n", "epoch: 66, batch: 100 // loss: 0.047\n", "epoch: 66, batch: 200 // loss: 0.043\n", "epoch: 66, batch: 300 // loss: 0.049\n", "epoch: 66, batch: 400 // loss: 0.047\n", "epoch: 66, batch: 500 // loss: 0.040\n", "epoch: 66, batch: 600 // loss: 0.041\n", "epoch: 66, batch: 700 // loss: 0.045\n", "epoch: 66, batch: 800 // loss: 0.043\n", "epoch: 66, batch: 900 // loss: 0.049\n", "epoch: 66, batch: 1000 // loss: 0.046\n", "epoch: 66, batch: 1100 // loss: 0.043\n", "epoch: 66, batch: 1200 // loss: 0.044\n", "epoch: 66, batch: 1300 // loss: 0.046\n", "epoch: 66, batch: 1400 // loss: 0.043\n", "epoch: 66, batch: 1500 // loss: 0.048\n", "epoch: 66, batch: 1600 // loss: 0.052\n", "epoch: 66, batch: 1700 // loss: 0.046\n", "epoch: 66, batch: 1800 // loss: 0.053\n", "epoch: 66, batch: 1900 // loss: 0.046\n", "epoch: 66, batch: 2000 // loss: 0.047\n", "epoch: 66, batch: 2100 // loss: 0.047\n", "epoch: 66, batch: 2200 // loss: 0.050\n", "epoch: 66, batch: 2300 // loss: 0.049\n", "epoch: 66, batch: 2400 // loss: 0.042\n", "epoch: 66, batch: 2500 // loss: 0.043\n", "epoch: 66, batch: 2600 // loss: 0.045\n", "epoch: 66, batch: 2700 // loss: 0.043\n", "epoch: 66, batch: 2800 // loss: 0.047\n", "epoch: 66, batch: 2900 // loss: 0.042\n", "epoch: 66, batch: 3000 // loss: 0.046\n", "epoch: 66, batch: 3100 // loss: 0.043\n", "epoch: 66, batch: 3200 // loss: 0.039\n", "epoch: 66, batch: 3300 // loss: 0.039\n", "epoch: 66, batch: 3400 // loss: 0.045\n", "epoch: 66, batch: 3500 // loss: 0.035\n", "epoch: 66, batch: 3600 // loss: 0.043\n", "epoch: 66, batch: 3700 // loss: 0.044\n", "\n", "epoch: 67, batch: 0 // loss: 0.054\n", "epoch: 67, batch: 100 // loss: 0.047\n", "epoch: 67, batch: 200 // loss: 0.043\n", "epoch: 67, batch: 300 // loss: 0.049\n", "epoch: 67, batch: 400 // loss: 0.047\n", "epoch: 67, batch: 500 // loss: 0.040\n", "epoch: 67, batch: 600 // loss: 0.041\n", "epoch: 67, batch: 700 // loss: 0.045\n", "epoch: 67, batch: 800 // loss: 0.043\n", "epoch: 67, batch: 900 // loss: 0.049\n", "epoch: 67, batch: 1000 // loss: 0.046\n", "epoch: 67, batch: 1100 // loss: 0.043\n", "epoch: 67, batch: 1200 // loss: 0.044\n", "epoch: 67, batch: 1300 // loss: 0.046\n", "epoch: 67, batch: 1400 // loss: 0.043\n", "epoch: 67, batch: 1500 // loss: 0.048\n", "epoch: 67, batch: 1600 // loss: 0.052\n", "epoch: 67, batch: 1700 // loss: 0.046\n", "epoch: 67, batch: 1800 // loss: 0.053\n", "epoch: 67, batch: 1900 // loss: 0.046\n", "epoch: 67, batch: 2000 // loss: 0.047\n", "epoch: 67, batch: 2100 // loss: 0.047\n", "epoch: 67, batch: 2200 // loss: 0.050\n", "epoch: 67, batch: 2300 // loss: 0.049\n", "epoch: 67, batch: 2400 // loss: 0.042\n", "epoch: 67, batch: 2500 // loss: 0.043\n", "epoch: 67, batch: 2600 // loss: 0.045\n", "epoch: 67, batch: 2700 // loss: 0.043\n", "epoch: 67, batch: 2800 // loss: 0.046\n", "epoch: 67, batch: 2900 // loss: 0.042\n", "epoch: 67, batch: 3000 // loss: 0.046\n", "epoch: 67, batch: 3100 // loss: 0.043\n", "epoch: 67, batch: 3200 // loss: 0.039\n", "epoch: 67, batch: 3300 // loss: 0.039\n", "epoch: 67, batch: 3400 // loss: 0.044\n", "epoch: 67, batch: 3500 // loss: 0.035\n", "epoch: 67, batch: 3600 // loss: 0.043\n", "epoch: 67, batch: 3700 // loss: 0.044\n", "\n", "epoch: 68, batch: 0 // loss: 0.054\n", "epoch: 68, batch: 100 // loss: 0.047\n", "epoch: 68, batch: 200 // loss: 0.043\n", "epoch: 68, batch: 300 // loss: 0.049\n", "epoch: 68, batch: 400 // loss: 0.046\n", "epoch: 68, batch: 500 // loss: 0.040\n", "epoch: 68, batch: 600 // loss: 0.041\n", "epoch: 68, batch: 700 // loss: 0.045\n", "epoch: 68, batch: 800 // loss: 0.042\n", "epoch: 68, batch: 900 // loss: 0.049\n", "epoch: 68, batch: 1000 // loss: 0.046\n", "epoch: 68, batch: 1100 // loss: 0.043\n", "epoch: 68, batch: 1200 // loss: 0.044\n", "epoch: 68, batch: 1300 // loss: 0.046\n", "epoch: 68, batch: 1400 // loss: 0.043\n", "epoch: 68, batch: 1500 // loss: 0.048\n", "epoch: 68, batch: 1600 // loss: 0.052\n", "epoch: 68, batch: 1700 // loss: 0.046\n", "epoch: 68, batch: 1800 // loss: 0.053\n", "epoch: 68, batch: 1900 // loss: 0.046\n", "epoch: 68, batch: 2000 // loss: 0.047\n", "epoch: 68, batch: 2100 // loss: 0.047\n", "epoch: 68, batch: 2200 // loss: 0.050\n", "epoch: 68, batch: 2300 // loss: 0.049\n", "epoch: 68, batch: 2400 // loss: 0.042\n", "epoch: 68, batch: 2500 // loss: 0.043\n", "epoch: 68, batch: 2600 // loss: 0.045\n", "epoch: 68, batch: 2700 // loss: 0.043\n", "epoch: 68, batch: 2800 // loss: 0.046\n", "epoch: 68, batch: 2900 // loss: 0.042\n", "epoch: 68, batch: 3000 // loss: 0.046\n", "epoch: 68, batch: 3100 // loss: 0.043\n", "epoch: 68, batch: 3200 // loss: 0.039\n", "epoch: 68, batch: 3300 // loss: 0.038\n", "epoch: 68, batch: 3400 // loss: 0.044\n", "epoch: 68, batch: 3500 // loss: 0.035\n", "epoch: 68, batch: 3600 // loss: 0.043\n", "epoch: 68, batch: 3700 // loss: 0.044\n", "\n", "epoch: 69, batch: 0 // loss: 0.054\n", "epoch: 69, batch: 100 // loss: 0.047\n", "epoch: 69, batch: 200 // loss: 0.043\n", "epoch: 69, batch: 300 // loss: 0.049\n", "epoch: 69, batch: 400 // loss: 0.046\n", "epoch: 69, batch: 500 // loss: 0.040\n", "epoch: 69, batch: 600 // loss: 0.041\n", "epoch: 69, batch: 700 // loss: 0.044\n", "epoch: 69, batch: 800 // loss: 0.042\n", "epoch: 69, batch: 900 // loss: 0.049\n", "epoch: 69, batch: 1000 // loss: 0.046\n", "epoch: 69, batch: 1100 // loss: 0.043\n", "epoch: 69, batch: 1200 // loss: 0.044\n", "epoch: 69, batch: 1300 // loss: 0.046\n", "epoch: 69, batch: 1400 // loss: 0.043\n", "epoch: 69, batch: 1500 // loss: 0.048\n", "epoch: 69, batch: 1600 // loss: 0.052\n", "epoch: 69, batch: 1700 // loss: 0.045\n", "epoch: 69, batch: 1800 // loss: 0.053\n", "epoch: 69, batch: 1900 // loss: 0.045\n", "epoch: 69, batch: 2000 // loss: 0.047\n", "epoch: 69, batch: 2100 // loss: 0.047\n", "epoch: 69, batch: 2200 // loss: 0.050\n", "epoch: 69, batch: 2300 // loss: 0.049\n", "epoch: 69, batch: 2400 // loss: 0.042\n", "epoch: 69, batch: 2500 // loss: 0.043\n", "epoch: 69, batch: 2600 // loss: 0.045\n", "epoch: 69, batch: 2700 // loss: 0.043\n", "epoch: 69, batch: 2800 // loss: 0.046\n", "epoch: 69, batch: 2900 // loss: 0.042\n", "epoch: 69, batch: 3000 // loss: 0.046\n", "epoch: 69, batch: 3100 // loss: 0.043\n", "epoch: 69, batch: 3200 // loss: 0.039\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 69, batch: 3300 // loss: 0.038\n", "epoch: 69, batch: 3400 // loss: 0.044\n", "epoch: 69, batch: 3500 // loss: 0.035\n", "epoch: 69, batch: 3600 // loss: 0.043\n", "epoch: 69, batch: 3700 // loss: 0.044\n", "\n", "epoch: 70, batch: 0 // loss: 0.053\n", "epoch: 70, batch: 100 // loss: 0.047\n", "epoch: 70, batch: 200 // loss: 0.043\n", "epoch: 70, batch: 300 // loss: 0.049\n", "epoch: 70, batch: 400 // loss: 0.046\n", "epoch: 70, batch: 500 // loss: 0.040\n", "epoch: 70, batch: 600 // loss: 0.041\n", "epoch: 70, batch: 700 // loss: 0.044\n", "epoch: 70, batch: 800 // loss: 0.042\n", "epoch: 70, batch: 900 // loss: 0.049\n", "epoch: 70, batch: 1000 // loss: 0.046\n", "epoch: 70, batch: 1100 // loss: 0.043\n", "epoch: 70, batch: 1200 // loss: 0.044\n", "epoch: 70, batch: 1300 // loss: 0.046\n", "epoch: 70, batch: 1400 // loss: 0.043\n", "epoch: 70, batch: 1500 // loss: 0.048\n", "epoch: 70, batch: 1600 // loss: 0.052\n", "epoch: 70, batch: 1700 // loss: 0.045\n", "epoch: 70, batch: 1800 // loss: 0.053\n", "epoch: 70, batch: 1900 // loss: 0.045\n", "epoch: 70, batch: 2000 // loss: 0.047\n", "epoch: 70, batch: 2100 // loss: 0.047\n", "epoch: 70, batch: 2200 // loss: 0.050\n", "epoch: 70, batch: 2300 // loss: 0.049\n", "epoch: 70, batch: 2400 // loss: 0.042\n", "epoch: 70, batch: 2500 // loss: 0.043\n", "epoch: 70, batch: 2600 // loss: 0.045\n", "epoch: 70, batch: 2700 // loss: 0.043\n", "epoch: 70, batch: 2800 // loss: 0.046\n", "epoch: 70, batch: 2900 // loss: 0.042\n", "epoch: 70, batch: 3000 // loss: 0.046\n", "epoch: 70, batch: 3100 // loss: 0.043\n", "epoch: 70, batch: 3200 // loss: 0.039\n", "epoch: 70, batch: 3300 // loss: 0.038\n", "epoch: 70, batch: 3400 // loss: 0.044\n", "epoch: 70, batch: 3500 // loss: 0.035\n", "epoch: 70, batch: 3600 // loss: 0.043\n", "epoch: 70, batch: 3700 // loss: 0.044\n", "\n", "epoch: 71, batch: 0 // loss: 0.053\n", "epoch: 71, batch: 100 // loss: 0.046\n", "epoch: 71, batch: 200 // loss: 0.043\n", "epoch: 71, batch: 300 // loss: 0.049\n", "epoch: 71, batch: 400 // loss: 0.046\n", "epoch: 71, batch: 500 // loss: 0.040\n", "epoch: 71, batch: 600 // loss: 0.041\n", "epoch: 71, batch: 700 // loss: 0.044\n", "epoch: 71, batch: 800 // loss: 0.042\n", "epoch: 71, batch: 900 // loss: 0.049\n", "epoch: 71, batch: 1000 // loss: 0.046\n", "epoch: 71, batch: 1100 // loss: 0.043\n", "epoch: 71, batch: 1200 // loss: 0.044\n", "epoch: 71, batch: 1300 // loss: 0.046\n", "epoch: 71, batch: 1400 // loss: 0.043\n", "epoch: 71, batch: 1500 // loss: 0.048\n", "epoch: 71, batch: 1600 // loss: 0.052\n", "epoch: 71, batch: 1700 // loss: 0.045\n", "epoch: 71, batch: 1800 // loss: 0.053\n", "epoch: 71, batch: 1900 // loss: 0.045\n", "epoch: 71, batch: 2000 // loss: 0.047\n", "epoch: 71, batch: 2100 // loss: 0.047\n", "epoch: 71, batch: 2200 // loss: 0.050\n", "epoch: 71, batch: 2300 // loss: 0.049\n", "epoch: 71, batch: 2400 // loss: 0.042\n", "epoch: 71, batch: 2500 // loss: 0.043\n", "epoch: 71, batch: 2600 // loss: 0.045\n", "epoch: 71, batch: 2700 // loss: 0.043\n", "epoch: 71, batch: 2800 // loss: 0.046\n", "epoch: 71, batch: 2900 // loss: 0.042\n", "epoch: 71, batch: 3000 // loss: 0.046\n", "epoch: 71, batch: 3100 // loss: 0.043\n", "epoch: 71, batch: 3200 // loss: 0.039\n", "epoch: 71, batch: 3300 // loss: 0.038\n", "epoch: 71, batch: 3400 // loss: 0.044\n", "epoch: 71, batch: 3500 // loss: 0.035\n", "epoch: 71, batch: 3600 // loss: 0.043\n", "epoch: 71, batch: 3700 // loss: 0.043\n", "\n", "epoch: 72, batch: 0 // loss: 0.053\n", "epoch: 72, batch: 100 // loss: 0.046\n", "epoch: 72, batch: 200 // loss: 0.043\n", "epoch: 72, batch: 300 // loss: 0.049\n", "epoch: 72, batch: 400 // loss: 0.046\n", "epoch: 72, batch: 500 // loss: 0.040\n", "epoch: 72, batch: 600 // loss: 0.041\n", "epoch: 72, batch: 700 // loss: 0.044\n", "epoch: 72, batch: 800 // loss: 0.042\n", "epoch: 72, batch: 900 // loss: 0.049\n", "epoch: 72, batch: 1000 // loss: 0.046\n", "epoch: 72, batch: 1100 // loss: 0.043\n", "epoch: 72, batch: 1200 // loss: 0.044\n", "epoch: 72, batch: 1300 // loss: 0.046\n", "epoch: 72, batch: 1400 // loss: 0.043\n", "epoch: 72, batch: 1500 // loss: 0.048\n", "epoch: 72, batch: 1600 // loss: 0.052\n", "epoch: 72, batch: 1700 // loss: 0.045\n", "epoch: 72, batch: 1800 // loss: 0.053\n", "epoch: 72, batch: 1900 // loss: 0.045\n", "epoch: 72, batch: 2000 // loss: 0.047\n", "epoch: 72, batch: 2100 // loss: 0.047\n", "epoch: 72, batch: 2200 // loss: 0.050\n", "epoch: 72, batch: 2300 // loss: 0.049\n", "epoch: 72, batch: 2400 // loss: 0.042\n", "epoch: 72, batch: 2500 // loss: 0.043\n", "epoch: 72, batch: 2600 // loss: 0.045\n", "epoch: 72, batch: 2700 // loss: 0.043\n", "epoch: 72, batch: 2800 // loss: 0.046\n", "epoch: 72, batch: 2900 // loss: 0.042\n", "epoch: 72, batch: 3000 // loss: 0.046\n", "epoch: 72, batch: 3100 // loss: 0.043\n", "epoch: 72, batch: 3200 // loss: 0.039\n", "epoch: 72, batch: 3300 // loss: 0.038\n", "epoch: 72, batch: 3400 // loss: 0.044\n", "epoch: 72, batch: 3500 // loss: 0.035\n", "epoch: 72, batch: 3600 // loss: 0.043\n", "epoch: 72, batch: 3700 // loss: 0.043\n", "\n", "epoch: 73, batch: 0 // loss: 0.053\n", "epoch: 73, batch: 100 // loss: 0.046\n", "epoch: 73, batch: 200 // loss: 0.043\n", "epoch: 73, batch: 300 // loss: 0.049\n", "epoch: 73, batch: 400 // loss: 0.046\n", "epoch: 73, batch: 500 // loss: 0.040\n", "epoch: 73, batch: 600 // loss: 0.040\n", "epoch: 73, batch: 700 // loss: 0.044\n", "epoch: 73, batch: 800 // loss: 0.042\n", "epoch: 73, batch: 900 // loss: 0.049\n", "epoch: 73, batch: 1000 // loss: 0.046\n", "epoch: 73, batch: 1100 // loss: 0.043\n", "epoch: 73, batch: 1200 // loss: 0.044\n", "epoch: 73, batch: 1300 // loss: 0.046\n", "epoch: 73, batch: 1400 // loss: 0.043\n", "epoch: 73, batch: 1500 // loss: 0.048\n", "epoch: 73, batch: 1600 // loss: 0.052\n", "epoch: 73, batch: 1700 // loss: 0.045\n", "epoch: 73, batch: 1800 // loss: 0.053\n", "epoch: 73, batch: 1900 // loss: 0.045\n", "epoch: 73, batch: 2000 // loss: 0.047\n", "epoch: 73, batch: 2100 // loss: 0.047\n", "epoch: 73, batch: 2200 // loss: 0.050\n", "epoch: 73, batch: 2300 // loss: 0.049\n", "epoch: 73, batch: 2400 // loss: 0.042\n", "epoch: 73, batch: 2500 // loss: 0.042\n", "epoch: 73, batch: 2600 // loss: 0.045\n", "epoch: 73, batch: 2700 // loss: 0.043\n", "epoch: 73, batch: 2800 // loss: 0.046\n", "epoch: 73, batch: 2900 // loss: 0.042\n", "epoch: 73, batch: 3000 // loss: 0.046\n", "epoch: 73, batch: 3100 // loss: 0.043\n", "epoch: 73, batch: 3200 // loss: 0.039\n", "epoch: 73, batch: 3300 // loss: 0.038\n", "epoch: 73, batch: 3400 // loss: 0.044\n", "epoch: 73, batch: 3500 // loss: 0.035\n", "epoch: 73, batch: 3600 // loss: 0.043\n", "epoch: 73, batch: 3700 // loss: 0.043\n", "\n", "epoch: 74, batch: 0 // loss: 0.053\n", "epoch: 74, batch: 100 // loss: 0.046\n", "epoch: 74, batch: 200 // loss: 0.043\n", "epoch: 74, batch: 300 // loss: 0.049\n", "epoch: 74, batch: 400 // loss: 0.046\n", "epoch: 74, batch: 500 // loss: 0.040\n", "epoch: 74, batch: 600 // loss: 0.040\n", "epoch: 74, batch: 700 // loss: 0.044\n", "epoch: 74, batch: 800 // loss: 0.042\n", "epoch: 74, batch: 900 // loss: 0.049\n", "epoch: 74, batch: 1000 // loss: 0.046\n", "epoch: 74, batch: 1100 // loss: 0.043\n", "epoch: 74, batch: 1200 // loss: 0.044\n", "epoch: 74, batch: 1300 // loss: 0.046\n", "epoch: 74, batch: 1400 // loss: 0.043\n", "epoch: 74, batch: 1500 // loss: 0.048\n", "epoch: 74, batch: 1600 // loss: 0.052\n", "epoch: 74, batch: 1700 // loss: 0.045\n", "epoch: 74, batch: 1800 // loss: 0.053\n", "epoch: 74, batch: 1900 // loss: 0.045\n", "epoch: 74, batch: 2000 // loss: 0.047\n", "epoch: 74, batch: 2100 // loss: 0.047\n", "epoch: 74, batch: 2200 // loss: 0.050\n", "epoch: 74, batch: 2300 // loss: 0.049\n", "epoch: 74, batch: 2400 // loss: 0.042\n", "epoch: 74, batch: 2500 // loss: 0.042\n", "epoch: 74, batch: 2600 // loss: 0.045\n", "epoch: 74, batch: 2700 // loss: 0.043\n", "epoch: 74, batch: 2800 // loss: 0.046\n", "epoch: 74, batch: 2900 // loss: 0.042\n", "epoch: 74, batch: 3000 // loss: 0.046\n", "epoch: 74, batch: 3100 // loss: 0.043\n", "epoch: 74, batch: 3200 // loss: 0.039\n", "epoch: 74, batch: 3300 // loss: 0.038\n", "epoch: 74, batch: 3400 // loss: 0.044\n", "epoch: 74, batch: 3500 // loss: 0.035\n", "epoch: 74, batch: 3600 // loss: 0.043\n", "epoch: 74, batch: 3700 // loss: 0.043\n", "\n", "epoch: 75, batch: 0 // loss: 0.053\n", "epoch: 75, batch: 100 // loss: 0.046\n", "epoch: 75, batch: 200 // loss: 0.043\n", "epoch: 75, batch: 300 // loss: 0.049\n", "epoch: 75, batch: 400 // loss: 0.046\n", "epoch: 75, batch: 500 // loss: 0.040\n", "epoch: 75, batch: 600 // loss: 0.040\n", "epoch: 75, batch: 700 // loss: 0.044\n", "epoch: 75, batch: 800 // loss: 0.042\n", "epoch: 75, batch: 900 // loss: 0.049\n", "epoch: 75, batch: 1000 // loss: 0.046\n", "epoch: 75, batch: 1100 // loss: 0.043\n", "epoch: 75, batch: 1200 // loss: 0.044\n", "epoch: 75, batch: 1300 // loss: 0.046\n", "epoch: 75, batch: 1400 // loss: 0.043\n", "epoch: 75, batch: 1500 // loss: 0.048\n", "epoch: 75, batch: 1600 // loss: 0.052\n", "epoch: 75, batch: 1700 // loss: 0.045\n", "epoch: 75, batch: 1800 // loss: 0.053\n", "epoch: 75, batch: 1900 // loss: 0.045\n", "epoch: 75, batch: 2000 // loss: 0.047\n", "epoch: 75, batch: 2100 // loss: 0.047\n", "epoch: 75, batch: 2200 // loss: 0.050\n", "epoch: 75, batch: 2300 // loss: 0.049\n", "epoch: 75, batch: 2400 // loss: 0.042\n", "epoch: 75, batch: 2500 // loss: 0.042\n", "epoch: 75, batch: 2600 // loss: 0.045\n", "epoch: 75, batch: 2700 // loss: 0.043\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 75, batch: 2800 // loss: 0.046\n", "epoch: 75, batch: 2900 // loss: 0.042\n", "epoch: 75, batch: 3000 // loss: 0.046\n", "epoch: 75, batch: 3100 // loss: 0.043\n", "epoch: 75, batch: 3200 // loss: 0.039\n", "epoch: 75, batch: 3300 // loss: 0.038\n", "epoch: 75, batch: 3400 // loss: 0.044\n", "epoch: 75, batch: 3500 // loss: 0.035\n", "epoch: 75, batch: 3600 // loss: 0.043\n", "epoch: 75, batch: 3700 // loss: 0.043\n", "\n", "epoch: 76, batch: 0 // loss: 0.053\n", "epoch: 76, batch: 100 // loss: 0.046\n", "epoch: 76, batch: 200 // loss: 0.043\n", "epoch: 76, batch: 300 // loss: 0.049\n", "epoch: 76, batch: 400 // loss: 0.046\n", "epoch: 76, batch: 500 // loss: 0.040\n", "epoch: 76, batch: 600 // loss: 0.040\n", "epoch: 76, batch: 700 // loss: 0.044\n", "epoch: 76, batch: 800 // loss: 0.042\n", "epoch: 76, batch: 900 // loss: 0.049\n", "epoch: 76, batch: 1000 // loss: 0.046\n", "epoch: 76, batch: 1100 // loss: 0.043\n", "epoch: 76, batch: 1200 // loss: 0.044\n", "epoch: 76, batch: 1300 // loss: 0.046\n", "epoch: 76, batch: 1400 // loss: 0.043\n", "epoch: 76, batch: 1500 // loss: 0.048\n", "epoch: 76, batch: 1600 // loss: 0.052\n", "epoch: 76, batch: 1700 // loss: 0.045\n", "epoch: 76, batch: 1800 // loss: 0.053\n", "epoch: 76, batch: 1900 // loss: 0.045\n", "epoch: 76, batch: 2000 // loss: 0.047\n", "epoch: 76, batch: 2100 // loss: 0.047\n", "epoch: 76, batch: 2200 // loss: 0.050\n", "epoch: 76, batch: 2300 // loss: 0.049\n", "epoch: 76, batch: 2400 // loss: 0.042\n", "epoch: 76, batch: 2500 // loss: 0.042\n", "epoch: 76, batch: 2600 // loss: 0.045\n", "epoch: 76, batch: 2700 // loss: 0.043\n", "epoch: 76, batch: 2800 // loss: 0.046\n", "epoch: 76, batch: 2900 // loss: 0.042\n", "epoch: 76, batch: 3000 // loss: 0.046\n", "epoch: 76, batch: 3100 // loss: 0.043\n", "epoch: 76, batch: 3200 // loss: 0.039\n", "epoch: 76, batch: 3300 // loss: 0.038\n", "epoch: 76, batch: 3400 // loss: 0.044\n", "epoch: 76, batch: 3500 // loss: 0.035\n", "epoch: 76, batch: 3600 // loss: 0.043\n", "epoch: 76, batch: 3700 // loss: 0.043\n", "\n", "epoch: 77, batch: 0 // loss: 0.053\n", "epoch: 77, batch: 100 // loss: 0.046\n", "epoch: 77, batch: 200 // loss: 0.043\n", "epoch: 77, batch: 300 // loss: 0.049\n", "epoch: 77, batch: 400 // loss: 0.046\n", "epoch: 77, batch: 500 // loss: 0.040\n", "epoch: 77, batch: 600 // loss: 0.040\n", "epoch: 77, batch: 700 // loss: 0.044\n", "epoch: 77, batch: 800 // loss: 0.042\n", "epoch: 77, batch: 900 // loss: 0.049\n", "epoch: 77, batch: 1000 // loss: 0.046\n", "epoch: 77, batch: 1100 // loss: 0.043\n", "epoch: 77, batch: 1200 // loss: 0.044\n", "epoch: 77, batch: 1300 // loss: 0.046\n", "epoch: 77, batch: 1400 // loss: 0.043\n", "epoch: 77, batch: 1500 // loss: 0.048\n", "epoch: 77, batch: 1600 // loss: 0.052\n", "epoch: 77, batch: 1700 // loss: 0.045\n", "epoch: 77, batch: 1800 // loss: 0.053\n", "epoch: 77, batch: 1900 // loss: 0.045\n", "epoch: 77, batch: 2000 // loss: 0.047\n", "epoch: 77, batch: 2100 // loss: 0.047\n", "epoch: 77, batch: 2200 // loss: 0.050\n", "epoch: 77, batch: 2300 // loss: 0.049\n", "epoch: 77, batch: 2400 // loss: 0.042\n", "epoch: 77, batch: 2500 // loss: 0.042\n", "epoch: 77, batch: 2600 // loss: 0.045\n", "epoch: 77, batch: 2700 // loss: 0.043\n", "epoch: 77, batch: 2800 // loss: 0.046\n", "epoch: 77, batch: 2900 // loss: 0.042\n", "epoch: 77, batch: 3000 // loss: 0.045\n", "epoch: 77, batch: 3100 // loss: 0.043\n", "epoch: 77, batch: 3200 // loss: 0.039\n", "epoch: 77, batch: 3300 // loss: 0.038\n", "epoch: 77, batch: 3400 // loss: 0.044\n", "epoch: 77, batch: 3500 // loss: 0.035\n", "epoch: 77, batch: 3600 // loss: 0.043\n", "epoch: 77, batch: 3700 // loss: 0.043\n", "\n", "epoch: 78, batch: 0 // loss: 0.053\n", "epoch: 78, batch: 100 // loss: 0.046\n", "epoch: 78, batch: 200 // loss: 0.043\n", "epoch: 78, batch: 300 // loss: 0.049\n", "epoch: 78, batch: 400 // loss: 0.046\n", "epoch: 78, batch: 500 // loss: 0.040\n", "epoch: 78, batch: 600 // loss: 0.040\n", "epoch: 78, batch: 700 // loss: 0.044\n", "epoch: 78, batch: 800 // loss: 0.042\n", "epoch: 78, batch: 900 // loss: 0.049\n", "epoch: 78, batch: 1000 // loss: 0.046\n", "epoch: 78, batch: 1100 // loss: 0.043\n", "epoch: 78, batch: 1200 // loss: 0.044\n", "epoch: 78, batch: 1300 // loss: 0.046\n", "epoch: 78, batch: 1400 // loss: 0.043\n", "epoch: 78, batch: 1500 // loss: 0.048\n", "epoch: 78, batch: 1600 // loss: 0.052\n", "epoch: 78, batch: 1700 // loss: 0.045\n", "epoch: 78, batch: 1800 // loss: 0.053\n", "epoch: 78, batch: 1900 // loss: 0.045\n", "epoch: 78, batch: 2000 // loss: 0.047\n", "epoch: 78, batch: 2100 // loss: 0.047\n", "epoch: 78, batch: 2200 // loss: 0.050\n", "epoch: 78, batch: 2300 // loss: 0.049\n", "epoch: 78, batch: 2400 // loss: 0.042\n", "epoch: 78, batch: 2500 // loss: 0.042\n", "epoch: 78, batch: 2600 // loss: 0.045\n", "epoch: 78, batch: 2700 // loss: 0.043\n", "epoch: 78, batch: 2800 // loss: 0.046\n", "epoch: 78, batch: 2900 // loss: 0.042\n", "epoch: 78, batch: 3000 // loss: 0.045\n", "epoch: 78, batch: 3100 // loss: 0.043\n", "epoch: 78, batch: 3200 // loss: 0.039\n", "epoch: 78, batch: 3300 // loss: 0.038\n", "epoch: 78, batch: 3400 // loss: 0.044\n", "epoch: 78, batch: 3500 // loss: 0.035\n", "epoch: 78, batch: 3600 // loss: 0.043\n", "epoch: 78, batch: 3700 // loss: 0.043\n", "\n", "epoch: 79, batch: 0 // loss: 0.053\n", "epoch: 79, batch: 100 // loss: 0.046\n", "epoch: 79, batch: 200 // loss: 0.043\n", "epoch: 79, batch: 300 // loss: 0.049\n", "epoch: 79, batch: 400 // loss: 0.046\n", "epoch: 79, batch: 500 // loss: 0.040\n", "epoch: 79, batch: 600 // loss: 0.040\n", "epoch: 79, batch: 700 // loss: 0.044\n", "epoch: 79, batch: 800 // loss: 0.042\n", "epoch: 79, batch: 900 // loss: 0.049\n", "epoch: 79, batch: 1000 // loss: 0.046\n", "epoch: 79, batch: 1100 // loss: 0.043\n", "epoch: 79, batch: 1200 // loss: 0.044\n", "epoch: 79, batch: 1300 // loss: 0.046\n", "epoch: 79, batch: 1400 // loss: 0.043\n", "epoch: 79, batch: 1500 // loss: 0.048\n", "epoch: 79, batch: 1600 // loss: 0.052\n", "epoch: 79, batch: 1700 // loss: 0.045\n", "epoch: 79, batch: 1800 // loss: 0.053\n", "epoch: 79, batch: 1900 // loss: 0.045\n", "epoch: 79, batch: 2000 // loss: 0.047\n", "epoch: 79, batch: 2100 // loss: 0.047\n", "epoch: 79, batch: 2200 // loss: 0.050\n", "epoch: 79, batch: 2300 // loss: 0.049\n", "epoch: 79, batch: 2400 // loss: 0.042\n", "epoch: 79, batch: 2500 // loss: 0.042\n", "epoch: 79, batch: 2600 // loss: 0.045\n", "epoch: 79, batch: 2700 // loss: 0.043\n", "epoch: 79, batch: 2800 // loss: 0.046\n", "epoch: 79, batch: 2900 // loss: 0.042\n", "epoch: 79, batch: 3000 // loss: 0.045\n", "epoch: 79, batch: 3100 // loss: 0.043\n", "epoch: 79, batch: 3200 // loss: 0.039\n", "epoch: 79, batch: 3300 // loss: 0.038\n", "epoch: 79, batch: 3400 // loss: 0.044\n", "epoch: 79, batch: 3500 // loss: 0.035\n", "epoch: 79, batch: 3600 // loss: 0.043\n", "epoch: 79, batch: 3700 // loss: 0.043\n", "\n", "epoch: 80, batch: 0 // loss: 0.053\n", "epoch: 80, batch: 100 // loss: 0.046\n", "epoch: 80, batch: 200 // loss: 0.043\n", "epoch: 80, batch: 300 // loss: 0.049\n", "epoch: 80, batch: 400 // loss: 0.046\n", "epoch: 80, batch: 500 // loss: 0.040\n", "epoch: 80, batch: 600 // loss: 0.040\n", "epoch: 80, batch: 700 // loss: 0.044\n", "epoch: 80, batch: 800 // loss: 0.042\n", "epoch: 80, batch: 900 // loss: 0.049\n", "epoch: 80, batch: 1000 // loss: 0.046\n", "epoch: 80, batch: 1100 // loss: 0.043\n", "epoch: 80, batch: 1200 // loss: 0.044\n", "epoch: 80, batch: 1300 // loss: 0.046\n", "epoch: 80, batch: 1400 // loss: 0.043\n", "epoch: 80, batch: 1500 // loss: 0.048\n", "epoch: 80, batch: 1600 // loss: 0.052\n", "epoch: 80, batch: 1700 // loss: 0.045\n", "epoch: 80, batch: 1800 // loss: 0.053\n", "epoch: 80, batch: 1900 // loss: 0.045\n", "epoch: 80, batch: 2000 // loss: 0.047\n", "epoch: 80, batch: 2100 // loss: 0.047\n", "epoch: 80, batch: 2200 // loss: 0.050\n", "epoch: 80, batch: 2300 // loss: 0.049\n", "epoch: 80, batch: 2400 // loss: 0.042\n", "epoch: 80, batch: 2500 // loss: 0.042\n", "epoch: 80, batch: 2600 // loss: 0.045\n", "epoch: 80, batch: 2700 // loss: 0.043\n", "epoch: 80, batch: 2800 // loss: 0.046\n", "epoch: 80, batch: 2900 // loss: 0.042\n", "epoch: 80, batch: 3000 // loss: 0.045\n", "epoch: 80, batch: 3100 // loss: 0.043\n", "epoch: 80, batch: 3200 // loss: 0.039\n", "epoch: 80, batch: 3300 // loss: 0.038\n", "epoch: 80, batch: 3400 // loss: 0.044\n", "epoch: 80, batch: 3500 // loss: 0.035\n", "epoch: 80, batch: 3600 // loss: 0.043\n", "epoch: 80, batch: 3700 // loss: 0.043\n", "\n", "epoch: 81, batch: 0 // loss: 0.053\n", "epoch: 81, batch: 100 // loss: 0.046\n", "epoch: 81, batch: 200 // loss: 0.043\n", "epoch: 81, batch: 300 // loss: 0.049\n", "epoch: 81, batch: 400 // loss: 0.046\n", "epoch: 81, batch: 500 // loss: 0.040\n", "epoch: 81, batch: 600 // loss: 0.040\n", "epoch: 81, batch: 700 // loss: 0.044\n", "epoch: 81, batch: 800 // loss: 0.042\n", "epoch: 81, batch: 900 // loss: 0.049\n", "epoch: 81, batch: 1000 // loss: 0.046\n", "epoch: 81, batch: 1100 // loss: 0.043\n", "epoch: 81, batch: 1200 // loss: 0.044\n", "epoch: 81, batch: 1300 // loss: 0.046\n", "epoch: 81, batch: 1400 // loss: 0.043\n", "epoch: 81, batch: 1500 // loss: 0.048\n", "epoch: 81, batch: 1600 // loss: 0.052\n", "epoch: 81, batch: 1700 // loss: 0.045\n", "epoch: 81, batch: 1800 // loss: 0.053\n", "epoch: 81, batch: 1900 // loss: 0.045\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 81, batch: 2000 // loss: 0.047\n", "epoch: 81, batch: 2100 // loss: 0.047\n", "epoch: 81, batch: 2200 // loss: 0.050\n", "epoch: 81, batch: 2300 // loss: 0.049\n", "epoch: 81, batch: 2400 // loss: 0.042\n", "epoch: 81, batch: 2500 // loss: 0.042\n", "epoch: 81, batch: 2600 // loss: 0.045\n", "epoch: 81, batch: 2700 // loss: 0.042\n", "epoch: 81, batch: 2800 // loss: 0.046\n", "epoch: 81, batch: 2900 // loss: 0.042\n", "epoch: 81, batch: 3000 // loss: 0.045\n", "epoch: 81, batch: 3100 // loss: 0.043\n", "epoch: 81, batch: 3200 // loss: 0.039\n", "epoch: 81, batch: 3300 // loss: 0.038\n", "epoch: 81, batch: 3400 // loss: 0.044\n", "epoch: 81, batch: 3500 // loss: 0.035\n", "epoch: 81, batch: 3600 // loss: 0.043\n", "epoch: 81, batch: 3700 // loss: 0.043\n", "\n", "epoch: 82, batch: 0 // loss: 0.053\n", "epoch: 82, batch: 100 // loss: 0.046\n", "epoch: 82, batch: 200 // loss: 0.043\n", "epoch: 82, batch: 300 // loss: 0.049\n", "epoch: 82, batch: 400 // loss: 0.046\n", "epoch: 82, batch: 500 // loss: 0.040\n", "epoch: 82, batch: 600 // loss: 0.040\n", "epoch: 82, batch: 700 // loss: 0.044\n", "epoch: 82, batch: 800 // loss: 0.042\n", "epoch: 82, batch: 900 // loss: 0.049\n", "epoch: 82, batch: 1000 // loss: 0.046\n", "epoch: 82, batch: 1100 // loss: 0.043\n", "epoch: 82, batch: 1200 // loss: 0.044\n", "epoch: 82, batch: 1300 // loss: 0.046\n", "epoch: 82, batch: 1400 // loss: 0.043\n", "epoch: 82, batch: 1500 // loss: 0.048\n", "epoch: 82, batch: 1600 // loss: 0.052\n", "epoch: 82, batch: 1700 // loss: 0.045\n", "epoch: 82, batch: 1800 // loss: 0.053\n", "epoch: 82, batch: 1900 // loss: 0.045\n", "epoch: 82, batch: 2000 // loss: 0.047\n", "epoch: 82, batch: 2100 // loss: 0.047\n", "epoch: 82, batch: 2200 // loss: 0.050\n", "epoch: 82, batch: 2300 // loss: 0.049\n", "epoch: 82, batch: 2400 // loss: 0.042\n", "epoch: 82, batch: 2500 // loss: 0.042\n", "epoch: 82, batch: 2600 // loss: 0.045\n", "epoch: 82, batch: 2700 // loss: 0.042\n", "epoch: 82, batch: 2800 // loss: 0.046\n", "epoch: 82, batch: 2900 // loss: 0.042\n", "epoch: 82, batch: 3000 // loss: 0.045\n", "epoch: 82, batch: 3100 // loss: 0.043\n", "epoch: 82, batch: 3200 // loss: 0.039\n", "epoch: 82, batch: 3300 // loss: 0.038\n", "epoch: 82, batch: 3400 // loss: 0.044\n", "epoch: 82, batch: 3500 // loss: 0.035\n", "epoch: 82, batch: 3600 // loss: 0.043\n", "epoch: 82, batch: 3700 // loss: 0.043\n", "\n", "epoch: 83, batch: 0 // loss: 0.053\n", "epoch: 83, batch: 100 // loss: 0.046\n", "epoch: 83, batch: 200 // loss: 0.043\n", "epoch: 83, batch: 300 // loss: 0.049\n", "epoch: 83, batch: 400 // loss: 0.046\n", "epoch: 83, batch: 500 // loss: 0.040\n", "epoch: 83, batch: 600 // loss: 0.040\n", "epoch: 83, batch: 700 // loss: 0.044\n", "epoch: 83, batch: 800 // loss: 0.042\n", "epoch: 83, batch: 900 // loss: 0.049\n", "epoch: 83, batch: 1000 // loss: 0.046\n", "epoch: 83, batch: 1100 // loss: 0.042\n", "epoch: 83, batch: 1200 // loss: 0.044\n", "epoch: 83, batch: 1300 // loss: 0.046\n", "epoch: 83, batch: 1400 // loss: 0.043\n", "epoch: 83, batch: 1500 // loss: 0.048\n", "epoch: 83, batch: 1600 // loss: 0.052\n", "epoch: 83, batch: 1700 // loss: 0.045\n", "epoch: 83, batch: 1800 // loss: 0.053\n", "epoch: 83, batch: 1900 // loss: 0.045\n", "epoch: 83, batch: 2000 // loss: 0.047\n", "epoch: 83, batch: 2100 // loss: 0.047\n", "epoch: 83, batch: 2200 // loss: 0.050\n", "epoch: 83, batch: 2300 // loss: 0.049\n", "epoch: 83, batch: 2400 // loss: 0.042\n", "epoch: 83, batch: 2500 // loss: 0.042\n", "epoch: 83, batch: 2600 // loss: 0.045\n", "epoch: 83, batch: 2700 // loss: 0.042\n", "epoch: 83, batch: 2800 // loss: 0.046\n", "epoch: 83, batch: 2900 // loss: 0.042\n", "epoch: 83, batch: 3000 // loss: 0.045\n", "epoch: 83, batch: 3100 // loss: 0.043\n", "epoch: 83, batch: 3200 // loss: 0.039\n", "epoch: 83, batch: 3300 // loss: 0.038\n", "epoch: 83, batch: 3400 // loss: 0.044\n", "epoch: 83, batch: 3500 // loss: 0.035\n", "epoch: 83, batch: 3600 // loss: 0.043\n", "epoch: 83, batch: 3700 // loss: 0.043\n", "\n", "epoch: 84, batch: 0 // loss: 0.053\n", "epoch: 84, batch: 100 // loss: 0.046\n", "epoch: 84, batch: 200 // loss: 0.043\n", "epoch: 84, batch: 300 // loss: 0.049\n", "epoch: 84, batch: 400 // loss: 0.046\n", "epoch: 84, batch: 500 // loss: 0.040\n", "epoch: 84, batch: 600 // loss: 0.040\n", "epoch: 84, batch: 700 // loss: 0.044\n", "epoch: 84, batch: 800 // loss: 0.042\n", "epoch: 84, batch: 900 // loss: 0.049\n", "epoch: 84, batch: 1000 // loss: 0.046\n", "epoch: 84, batch: 1100 // loss: 0.042\n", "epoch: 84, batch: 1200 // loss: 0.044\n", "epoch: 84, batch: 1300 // loss: 0.046\n", "epoch: 84, batch: 1400 // loss: 0.043\n", "epoch: 84, batch: 1500 // loss: 0.048\n", "epoch: 84, batch: 1600 // loss: 0.052\n", "epoch: 84, batch: 1700 // loss: 0.045\n", "epoch: 84, batch: 1800 // loss: 0.053\n", "epoch: 84, batch: 1900 // loss: 0.045\n", "epoch: 84, batch: 2000 // loss: 0.047\n", "epoch: 84, batch: 2100 // loss: 0.047\n", "epoch: 84, batch: 2200 // loss: 0.050\n", "epoch: 84, batch: 2300 // loss: 0.049\n", "epoch: 84, batch: 2400 // loss: 0.042\n", "epoch: 84, batch: 2500 // loss: 0.042\n", "epoch: 84, batch: 2600 // loss: 0.045\n", "epoch: 84, batch: 2700 // loss: 0.042\n", "epoch: 84, batch: 2800 // loss: 0.046\n", "epoch: 84, batch: 2900 // loss: 0.042\n", "epoch: 84, batch: 3000 // loss: 0.045\n", "epoch: 84, batch: 3100 // loss: 0.043\n", "epoch: 84, batch: 3200 // loss: 0.039\n", "epoch: 84, batch: 3300 // loss: 0.038\n", "epoch: 84, batch: 3400 // loss: 0.044\n", "epoch: 84, batch: 3500 // loss: 0.035\n", "epoch: 84, batch: 3600 // loss: 0.043\n", "epoch: 84, batch: 3700 // loss: 0.043\n", "\n", "epoch: 85, batch: 0 // loss: 0.053\n", "epoch: 85, batch: 100 // loss: 0.046\n", "epoch: 85, batch: 200 // loss: 0.043\n", "epoch: 85, batch: 300 // loss: 0.049\n", "epoch: 85, batch: 400 // loss: 0.046\n", "epoch: 85, batch: 500 // loss: 0.040\n", "epoch: 85, batch: 600 // loss: 0.040\n", "epoch: 85, batch: 700 // loss: 0.044\n", "epoch: 85, batch: 800 // loss: 0.042\n", "epoch: 85, batch: 900 // loss: 0.049\n", "epoch: 85, batch: 1000 // loss: 0.046\n", "epoch: 85, batch: 1100 // loss: 0.042\n", "epoch: 85, batch: 1200 // loss: 0.044\n", "epoch: 85, batch: 1300 // loss: 0.046\n", "epoch: 85, batch: 1400 // loss: 0.043\n", "epoch: 85, batch: 1500 // loss: 0.048\n", "epoch: 85, batch: 1600 // loss: 0.052\n", "epoch: 85, batch: 1700 // loss: 0.045\n", "epoch: 85, batch: 1800 // loss: 0.053\n", "epoch: 85, batch: 1900 // loss: 0.045\n", "epoch: 85, batch: 2000 // loss: 0.047\n", "epoch: 85, batch: 2100 // loss: 0.046\n", "epoch: 85, batch: 2200 // loss: 0.050\n", "epoch: 85, batch: 2300 // loss: 0.049\n", "epoch: 85, batch: 2400 // loss: 0.042\n", "epoch: 85, batch: 2500 // loss: 0.042\n", "epoch: 85, batch: 2600 // loss: 0.045\n", "epoch: 85, batch: 2700 // loss: 0.042\n", "epoch: 85, batch: 2800 // loss: 0.046\n", "epoch: 85, batch: 2900 // loss: 0.042\n", "epoch: 85, batch: 3000 // loss: 0.045\n", "epoch: 85, batch: 3100 // loss: 0.043\n", "epoch: 85, batch: 3200 // loss: 0.039\n", "epoch: 85, batch: 3300 // loss: 0.038\n", "epoch: 85, batch: 3400 // loss: 0.044\n", "epoch: 85, batch: 3500 // loss: 0.035\n", "epoch: 85, batch: 3600 // loss: 0.043\n", "epoch: 85, batch: 3700 // loss: 0.043\n", "\n", "epoch: 86, batch: 0 // loss: 0.053\n", "epoch: 86, batch: 100 // loss: 0.046\n", "epoch: 86, batch: 200 // loss: 0.043\n", "epoch: 86, batch: 300 // loss: 0.049\n", "epoch: 86, batch: 400 // loss: 0.046\n", "epoch: 86, batch: 500 // loss: 0.040\n", "epoch: 86, batch: 600 // loss: 0.040\n", "epoch: 86, batch: 700 // loss: 0.044\n", "epoch: 86, batch: 800 // loss: 0.042\n", "epoch: 86, batch: 900 // loss: 0.049\n", "epoch: 86, batch: 1000 // loss: 0.046\n", "epoch: 86, batch: 1100 // loss: 0.042\n", "epoch: 86, batch: 1200 // loss: 0.044\n", "epoch: 86, batch: 1300 // loss: 0.046\n", "epoch: 86, batch: 1400 // loss: 0.043\n", "epoch: 86, batch: 1500 // loss: 0.048\n", "epoch: 86, batch: 1600 // loss: 0.052\n", "epoch: 86, batch: 1700 // loss: 0.045\n", "epoch: 86, batch: 1800 // loss: 0.053\n", "epoch: 86, batch: 1900 // loss: 0.045\n", "epoch: 86, batch: 2000 // loss: 0.047\n", "epoch: 86, batch: 2100 // loss: 0.046\n", "epoch: 86, batch: 2200 // loss: 0.050\n", "epoch: 86, batch: 2300 // loss: 0.049\n", "epoch: 86, batch: 2400 // loss: 0.042\n", "epoch: 86, batch: 2500 // loss: 0.042\n", "epoch: 86, batch: 2600 // loss: 0.045\n", "epoch: 86, batch: 2700 // loss: 0.042\n", "epoch: 86, batch: 2800 // loss: 0.046\n", "epoch: 86, batch: 2900 // loss: 0.042\n", "epoch: 86, batch: 3000 // loss: 0.045\n", "epoch: 86, batch: 3100 // loss: 0.043\n", "epoch: 86, batch: 3200 // loss: 0.039\n", "epoch: 86, batch: 3300 // loss: 0.038\n", "epoch: 86, batch: 3400 // loss: 0.044\n", "epoch: 86, batch: 3500 // loss: 0.035\n", "epoch: 86, batch: 3600 // loss: 0.043\n", "epoch: 86, batch: 3700 // loss: 0.043\n", "\n", "epoch: 87, batch: 0 // loss: 0.053\n", "epoch: 87, batch: 100 // loss: 0.046\n", "epoch: 87, batch: 200 // loss: 0.043\n", "epoch: 87, batch: 300 // loss: 0.049\n", "epoch: 87, batch: 400 // loss: 0.046\n", "epoch: 87, batch: 500 // loss: 0.040\n", "epoch: 87, batch: 600 // loss: 0.040\n", "epoch: 87, batch: 700 // loss: 0.044\n", "epoch: 87, batch: 800 // loss: 0.042\n", "epoch: 87, batch: 900 // loss: 0.049\n", "epoch: 87, batch: 1000 // loss: 0.046\n", "epoch: 87, batch: 1100 // loss: 0.042\n", "epoch: 87, batch: 1200 // loss: 0.044\n", "epoch: 87, batch: 1300 // loss: 0.046\n", "epoch: 87, batch: 1400 // loss: 0.043\n", "epoch: 87, batch: 1500 // loss: 0.048\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 87, batch: 1600 // loss: 0.052\n", "epoch: 87, batch: 1700 // loss: 0.045\n", "epoch: 87, batch: 1800 // loss: 0.053\n", "epoch: 87, batch: 1900 // loss: 0.045\n", "epoch: 87, batch: 2000 // loss: 0.047\n", "epoch: 87, batch: 2100 // loss: 0.046\n", "epoch: 87, batch: 2200 // loss: 0.050\n", "epoch: 87, batch: 2300 // loss: 0.049\n", "epoch: 87, batch: 2400 // loss: 0.042\n", "epoch: 87, batch: 2500 // loss: 0.042\n", "epoch: 87, batch: 2600 // loss: 0.045\n", "epoch: 87, batch: 2700 // loss: 0.042\n", "epoch: 87, batch: 2800 // loss: 0.046\n", "epoch: 87, batch: 2900 // loss: 0.042\n", "epoch: 87, batch: 3000 // loss: 0.045\n", "epoch: 87, batch: 3100 // loss: 0.043\n", "epoch: 87, batch: 3200 // loss: 0.039\n", "epoch: 87, batch: 3300 // loss: 0.038\n", "epoch: 87, batch: 3400 // loss: 0.044\n", "epoch: 87, batch: 3500 // loss: 0.035\n", "epoch: 87, batch: 3600 // loss: 0.043\n", "epoch: 87, batch: 3700 // loss: 0.043\n", "\n", "epoch: 88, batch: 0 // loss: 0.053\n", "epoch: 88, batch: 100 // loss: 0.046\n", "epoch: 88, batch: 200 // loss: 0.043\n", "epoch: 88, batch: 300 // loss: 0.049\n", "epoch: 88, batch: 400 // loss: 0.046\n", "epoch: 88, batch: 500 // loss: 0.040\n", "epoch: 88, batch: 600 // loss: 0.040\n", "epoch: 88, batch: 700 // loss: 0.044\n", "epoch: 88, batch: 800 // loss: 0.042\n", "epoch: 88, batch: 900 // loss: 0.049\n", "epoch: 88, batch: 1000 // loss: 0.046\n", "epoch: 88, batch: 1100 // loss: 0.042\n", "epoch: 88, batch: 1200 // loss: 0.044\n", "epoch: 88, batch: 1300 // loss: 0.046\n", "epoch: 88, batch: 1400 // loss: 0.043\n", "epoch: 88, batch: 1500 // loss: 0.048\n", "epoch: 88, batch: 1600 // loss: 0.052\n", "epoch: 88, batch: 1700 // loss: 0.045\n", "epoch: 88, batch: 1800 // loss: 0.053\n", "epoch: 88, batch: 1900 // loss: 0.045\n", "epoch: 88, batch: 2000 // loss: 0.047\n", "epoch: 88, batch: 2100 // loss: 0.046\n", "epoch: 88, batch: 2200 // loss: 0.050\n", "epoch: 88, batch: 2300 // loss: 0.049\n", "epoch: 88, batch: 2400 // loss: 0.042\n", "epoch: 88, batch: 2500 // loss: 0.042\n", "epoch: 88, batch: 2600 // loss: 0.045\n", "epoch: 88, batch: 2700 // loss: 0.042\n", "epoch: 88, batch: 2800 // loss: 0.046\n", "epoch: 88, batch: 2900 // loss: 0.042\n", "epoch: 88, batch: 3000 // loss: 0.045\n", "epoch: 88, batch: 3100 // loss: 0.043\n", "epoch: 88, batch: 3200 // loss: 0.039\n", "epoch: 88, batch: 3300 // loss: 0.038\n", "epoch: 88, batch: 3400 // loss: 0.044\n", "epoch: 88, batch: 3500 // loss: 0.035\n", "epoch: 88, batch: 3600 // loss: 0.043\n", "epoch: 88, batch: 3700 // loss: 0.043\n", "\n", "epoch: 89, batch: 0 // loss: 0.053\n", "epoch: 89, batch: 100 // loss: 0.046\n", "epoch: 89, batch: 200 // loss: 0.043\n", "epoch: 89, batch: 300 // loss: 0.049\n", "epoch: 89, batch: 400 // loss: 0.046\n", "epoch: 89, batch: 500 // loss: 0.040\n", "epoch: 89, batch: 600 // loss: 0.040\n", "epoch: 89, batch: 700 // loss: 0.044\n", "epoch: 89, batch: 800 // loss: 0.042\n", "epoch: 89, batch: 900 // loss: 0.049\n", "epoch: 89, batch: 1000 // loss: 0.046\n", "epoch: 89, batch: 1100 // loss: 0.042\n", "epoch: 89, batch: 1200 // loss: 0.044\n", "epoch: 89, batch: 1300 // loss: 0.046\n", "epoch: 89, batch: 1400 // loss: 0.043\n", "epoch: 89, batch: 1500 // loss: 0.048\n", "epoch: 89, batch: 1600 // loss: 0.052\n", "epoch: 89, batch: 1700 // loss: 0.045\n", "epoch: 89, batch: 1800 // loss: 0.053\n", "epoch: 89, batch: 1900 // loss: 0.045\n", "epoch: 89, batch: 2000 // loss: 0.047\n", "epoch: 89, batch: 2100 // loss: 0.046\n", "epoch: 89, batch: 2200 // loss: 0.050\n", "epoch: 89, batch: 2300 // loss: 0.049\n", "epoch: 89, batch: 2400 // loss: 0.042\n", "epoch: 89, batch: 2500 // loss: 0.042\n", "epoch: 89, batch: 2600 // loss: 0.045\n", "epoch: 89, batch: 2700 // loss: 0.042\n", "epoch: 89, batch: 2800 // loss: 0.046\n", "epoch: 89, batch: 2900 // loss: 0.042\n", "epoch: 89, batch: 3000 // loss: 0.045\n", "epoch: 89, batch: 3100 // loss: 0.043\n", "epoch: 89, batch: 3200 // loss: 0.039\n", "epoch: 89, batch: 3300 // loss: 0.038\n", "epoch: 89, batch: 3400 // loss: 0.044\n", "epoch: 89, batch: 3500 // loss: 0.035\n", "epoch: 89, batch: 3600 // loss: 0.043\n", "epoch: 89, batch: 3700 // loss: 0.043\n", "\n", "epoch: 90, batch: 0 // loss: 0.053\n", "epoch: 90, batch: 100 // loss: 0.046\n", "epoch: 90, batch: 200 // loss: 0.043\n", "epoch: 90, batch: 300 // loss: 0.049\n", "epoch: 90, batch: 400 // loss: 0.046\n", "epoch: 90, batch: 500 // loss: 0.040\n", "epoch: 90, batch: 600 // loss: 0.040\n", "epoch: 90, batch: 700 // loss: 0.044\n", "epoch: 90, batch: 800 // loss: 0.042\n", "epoch: 90, batch: 900 // loss: 0.049\n", "epoch: 90, batch: 1000 // loss: 0.046\n", "epoch: 90, batch: 1100 // loss: 0.042\n", "epoch: 90, batch: 1200 // loss: 0.044\n", "epoch: 90, batch: 1300 // loss: 0.046\n", "epoch: 90, batch: 1400 // loss: 0.043\n", "epoch: 90, batch: 1500 // loss: 0.048\n", "epoch: 90, batch: 1600 // loss: 0.052\n", "epoch: 90, batch: 1700 // loss: 0.045\n", "epoch: 90, batch: 1800 // loss: 0.053\n", "epoch: 90, batch: 1900 // loss: 0.045\n", "epoch: 90, batch: 2000 // loss: 0.047\n", "epoch: 90, batch: 2100 // loss: 0.046\n", "epoch: 90, batch: 2200 // loss: 0.050\n", "epoch: 90, batch: 2300 // loss: 0.049\n", "epoch: 90, batch: 2400 // loss: 0.042\n", "epoch: 90, batch: 2500 // loss: 0.042\n", "epoch: 90, batch: 2600 // loss: 0.045\n", "epoch: 90, batch: 2700 // loss: 0.042\n", "epoch: 90, batch: 2800 // loss: 0.046\n", "epoch: 90, batch: 2900 // loss: 0.042\n", "epoch: 90, batch: 3000 // loss: 0.045\n", "epoch: 90, batch: 3100 // loss: 0.043\n", "epoch: 90, batch: 3200 // loss: 0.039\n", "epoch: 90, batch: 3300 // loss: 0.038\n", "epoch: 90, batch: 3400 // loss: 0.044\n", "epoch: 90, batch: 3500 // loss: 0.035\n", "epoch: 90, batch: 3600 // loss: 0.043\n", "epoch: 90, batch: 3700 // loss: 0.043\n", "\n", "epoch: 91, batch: 0 // loss: 0.053\n", "epoch: 91, batch: 100 // loss: 0.046\n", "epoch: 91, batch: 200 // loss: 0.043\n", "epoch: 91, batch: 300 // loss: 0.049\n", "epoch: 91, batch: 400 // loss: 0.046\n", "epoch: 91, batch: 500 // loss: 0.040\n", "epoch: 91, batch: 600 // loss: 0.040\n", "epoch: 91, batch: 700 // loss: 0.044\n", "epoch: 91, batch: 800 // loss: 0.042\n", "epoch: 91, batch: 900 // loss: 0.049\n", "epoch: 91, batch: 1000 // loss: 0.046\n", "epoch: 91, batch: 1100 // loss: 0.042\n", "epoch: 91, batch: 1200 // loss: 0.044\n", "epoch: 91, batch: 1300 // loss: 0.046\n", "epoch: 91, batch: 1400 // loss: 0.043\n", "epoch: 91, batch: 1500 // loss: 0.048\n", "epoch: 91, batch: 1600 // loss: 0.052\n", "epoch: 91, batch: 1700 // loss: 0.045\n", "epoch: 91, batch: 1800 // loss: 0.053\n", "epoch: 91, batch: 1900 // loss: 0.045\n", "epoch: 91, batch: 2000 // loss: 0.047\n", "epoch: 91, batch: 2100 // loss: 0.046\n", "epoch: 91, batch: 2200 // loss: 0.050\n", "epoch: 91, batch: 2300 // loss: 0.049\n", "epoch: 91, batch: 2400 // loss: 0.042\n", "epoch: 91, batch: 2500 // loss: 0.042\n", "epoch: 91, batch: 2600 // loss: 0.045\n", "epoch: 91, batch: 2700 // loss: 0.042\n", "epoch: 91, batch: 2800 // loss: 0.046\n", "epoch: 91, batch: 2900 // loss: 0.042\n", "epoch: 91, batch: 3000 // loss: 0.045\n", "epoch: 91, batch: 3100 // loss: 0.043\n", "epoch: 91, batch: 3200 // loss: 0.039\n", "epoch: 91, batch: 3300 // loss: 0.038\n", "epoch: 91, batch: 3400 // loss: 0.044\n", "epoch: 91, batch: 3500 // loss: 0.035\n", "epoch: 91, batch: 3600 // loss: 0.043\n", "epoch: 91, batch: 3700 // loss: 0.043\n", "\n", "epoch: 92, batch: 0 // loss: 0.053\n", "epoch: 92, batch: 100 // loss: 0.046\n", "epoch: 92, batch: 200 // loss: 0.043\n", "epoch: 92, batch: 300 // loss: 0.049\n", "epoch: 92, batch: 400 // loss: 0.046\n", "epoch: 92, batch: 500 // loss: 0.040\n", "epoch: 92, batch: 600 // loss: 0.040\n", "epoch: 92, batch: 700 // loss: 0.044\n", "epoch: 92, batch: 800 // loss: 0.042\n", "epoch: 92, batch: 900 // loss: 0.049\n", "epoch: 92, batch: 1000 // loss: 0.046\n", "epoch: 92, batch: 1100 // loss: 0.042\n", "epoch: 92, batch: 1200 // loss: 0.044\n", "epoch: 92, batch: 1300 // loss: 0.046\n", "epoch: 92, batch: 1400 // loss: 0.043\n", "epoch: 92, batch: 1500 // loss: 0.048\n", "epoch: 92, batch: 1600 // loss: 0.052\n", "epoch: 92, batch: 1700 // loss: 0.045\n", "epoch: 92, batch: 1800 // loss: 0.053\n", "epoch: 92, batch: 1900 // loss: 0.045\n", "epoch: 92, batch: 2000 // loss: 0.047\n", "epoch: 92, batch: 2100 // loss: 0.046\n", "epoch: 92, batch: 2200 // loss: 0.050\n", "epoch: 92, batch: 2300 // loss: 0.049\n", "epoch: 92, batch: 2400 // loss: 0.042\n", "epoch: 92, batch: 2500 // loss: 0.042\n", "epoch: 92, batch: 2600 // loss: 0.045\n", "epoch: 92, batch: 2700 // loss: 0.042\n", "epoch: 92, batch: 2800 // loss: 0.046\n", "epoch: 92, batch: 2900 // loss: 0.042\n", "epoch: 92, batch: 3000 // loss: 0.045\n", "epoch: 92, batch: 3100 // loss: 0.043\n", "epoch: 92, batch: 3200 // loss: 0.039\n", "epoch: 92, batch: 3300 // loss: 0.038\n", "epoch: 92, batch: 3400 // loss: 0.044\n", "epoch: 92, batch: 3500 // loss: 0.035\n", "epoch: 92, batch: 3600 // loss: 0.043\n", "epoch: 92, batch: 3700 // loss: 0.043\n", "\n", "epoch: 93, batch: 0 // loss: 0.053\n", "epoch: 93, batch: 100 // loss: 0.046\n", "epoch: 93, batch: 200 // loss: 0.043\n", "epoch: 93, batch: 300 // loss: 0.049\n", "epoch: 93, batch: 400 // loss: 0.046\n", "epoch: 93, batch: 500 // loss: 0.040\n", "epoch: 93, batch: 600 // loss: 0.040\n", "epoch: 93, batch: 700 // loss: 0.044\n", "epoch: 93, batch: 800 // loss: 0.042\n", "epoch: 93, batch: 900 // loss: 0.049\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 93, batch: 1000 // loss: 0.046\n", "epoch: 93, batch: 1100 // loss: 0.042\n", "epoch: 93, batch: 1200 // loss: 0.044\n", "epoch: 93, batch: 1300 // loss: 0.046\n", "epoch: 93, batch: 1400 // loss: 0.043\n", "epoch: 93, batch: 1500 // loss: 0.048\n", "epoch: 93, batch: 1600 // loss: 0.052\n", "epoch: 93, batch: 1700 // loss: 0.045\n", "epoch: 93, batch: 1800 // loss: 0.053\n", "epoch: 93, batch: 1900 // loss: 0.045\n", "epoch: 93, batch: 2000 // loss: 0.047\n", "epoch: 93, batch: 2100 // loss: 0.046\n", "epoch: 93, batch: 2200 // loss: 0.050\n", "epoch: 93, batch: 2300 // loss: 0.049\n", "epoch: 93, batch: 2400 // loss: 0.042\n", "epoch: 93, batch: 2500 // loss: 0.042\n", "epoch: 93, batch: 2600 // loss: 0.045\n", "epoch: 93, batch: 2700 // loss: 0.042\n", "epoch: 93, batch: 2800 // loss: 0.046\n", "epoch: 93, batch: 2900 // loss: 0.042\n", "epoch: 93, batch: 3000 // loss: 0.045\n", "epoch: 93, batch: 3100 // loss: 0.043\n", "epoch: 93, batch: 3200 // loss: 0.039\n", "epoch: 93, batch: 3300 // loss: 0.038\n", "epoch: 93, batch: 3400 // loss: 0.044\n", "epoch: 93, batch: 3500 // loss: 0.035\n", "epoch: 93, batch: 3600 // loss: 0.043\n", "epoch: 93, batch: 3700 // loss: 0.043\n", "\n", "epoch: 94, batch: 0 // loss: 0.053\n", "epoch: 94, batch: 100 // loss: 0.046\n", "epoch: 94, batch: 200 // loss: 0.043\n", "epoch: 94, batch: 300 // loss: 0.049\n", "epoch: 94, batch: 400 // loss: 0.046\n", "epoch: 94, batch: 500 // loss: 0.040\n", "epoch: 94, batch: 600 // loss: 0.040\n", "epoch: 94, batch: 700 // loss: 0.044\n", "epoch: 94, batch: 800 // loss: 0.042\n", "epoch: 94, batch: 900 // loss: 0.049\n", "epoch: 94, batch: 1000 // loss: 0.046\n", "epoch: 94, batch: 1100 // loss: 0.042\n", "epoch: 94, batch: 1200 // loss: 0.044\n", "epoch: 94, batch: 1300 // loss: 0.046\n", "epoch: 94, batch: 1400 // loss: 0.043\n", "epoch: 94, batch: 1500 // loss: 0.048\n", "epoch: 94, batch: 1600 // loss: 0.052\n", "epoch: 94, batch: 1700 // loss: 0.045\n", "epoch: 94, batch: 1800 // loss: 0.053\n", "epoch: 94, batch: 1900 // loss: 0.045\n", "epoch: 94, batch: 2000 // loss: 0.047\n", "epoch: 94, batch: 2100 // loss: 0.046\n", "epoch: 94, batch: 2200 // loss: 0.050\n", "epoch: 94, batch: 2300 // loss: 0.049\n", "epoch: 94, batch: 2400 // loss: 0.042\n", "epoch: 94, batch: 2500 // loss: 0.042\n", "epoch: 94, batch: 2600 // loss: 0.045\n", "epoch: 94, batch: 2700 // loss: 0.042\n", "epoch: 94, batch: 2800 // loss: 0.046\n", "epoch: 94, batch: 2900 // loss: 0.042\n", "epoch: 94, batch: 3000 // loss: 0.045\n", "epoch: 94, batch: 3100 // loss: 0.043\n", "epoch: 94, batch: 3200 // loss: 0.039\n", "epoch: 94, batch: 3300 // loss: 0.038\n", "epoch: 94, batch: 3400 // loss: 0.044\n", "epoch: 94, batch: 3500 // loss: 0.035\n", "epoch: 94, batch: 3600 // loss: 0.043\n", "epoch: 94, batch: 3700 // loss: 0.043\n", "\n", "epoch: 95, batch: 0 // loss: 0.053\n", "epoch: 95, batch: 100 // loss: 0.046\n", "epoch: 95, batch: 200 // loss: 0.043\n", "epoch: 95, batch: 300 // loss: 0.049\n", "epoch: 95, batch: 400 // loss: 0.046\n", "epoch: 95, batch: 500 // loss: 0.040\n", "epoch: 95, batch: 600 // loss: 0.040\n", "epoch: 95, batch: 700 // loss: 0.044\n", "epoch: 95, batch: 800 // loss: 0.042\n", "epoch: 95, batch: 900 // loss: 0.049\n", "epoch: 95, batch: 1000 // loss: 0.046\n", "epoch: 95, batch: 1100 // loss: 0.042\n", "epoch: 95, batch: 1200 // loss: 0.044\n", "epoch: 95, batch: 1300 // loss: 0.046\n", "epoch: 95, batch: 1400 // loss: 0.043\n", "epoch: 95, batch: 1500 // loss: 0.048\n", "epoch: 95, batch: 1600 // loss: 0.052\n", "epoch: 95, batch: 1700 // loss: 0.045\n", "epoch: 95, batch: 1800 // loss: 0.053\n", "epoch: 95, batch: 1900 // loss: 0.045\n", "epoch: 95, batch: 2000 // loss: 0.047\n", "epoch: 95, batch: 2100 // loss: 0.046\n", "epoch: 95, batch: 2200 // loss: 0.050\n", "epoch: 95, batch: 2300 // loss: 0.049\n", "epoch: 95, batch: 2400 // loss: 0.042\n", "epoch: 95, batch: 2500 // loss: 0.042\n", "epoch: 95, batch: 2600 // loss: 0.045\n", "epoch: 95, batch: 2700 // loss: 0.042\n", "epoch: 95, batch: 2800 // loss: 0.046\n", "epoch: 95, batch: 2900 // loss: 0.042\n", "epoch: 95, batch: 3000 // loss: 0.045\n", "epoch: 95, batch: 3100 // loss: 0.043\n", "epoch: 95, batch: 3200 // loss: 0.039\n", "epoch: 95, batch: 3300 // loss: 0.038\n", "epoch: 95, batch: 3400 // loss: 0.044\n", "epoch: 95, batch: 3500 // loss: 0.035\n", "epoch: 95, batch: 3600 // loss: 0.043\n", "epoch: 95, batch: 3700 // loss: 0.043\n", "\n", "epoch: 96, batch: 0 // loss: 0.053\n", "epoch: 96, batch: 100 // loss: 0.046\n", "epoch: 96, batch: 200 // loss: 0.043\n", "epoch: 96, batch: 300 // loss: 0.049\n", "epoch: 96, batch: 400 // loss: 0.046\n", "epoch: 96, batch: 500 // loss: 0.040\n", "epoch: 96, batch: 600 // loss: 0.040\n", "epoch: 96, batch: 700 // loss: 0.044\n", "epoch: 96, batch: 800 // loss: 0.042\n", "epoch: 96, batch: 900 // loss: 0.049\n", "epoch: 96, batch: 1000 // loss: 0.046\n", "epoch: 96, batch: 1100 // loss: 0.042\n", "epoch: 96, batch: 1200 // loss: 0.044\n", "epoch: 96, batch: 1300 // loss: 0.046\n", "epoch: 96, batch: 1400 // loss: 0.043\n", "epoch: 96, batch: 1500 // loss: 0.048\n", "epoch: 96, batch: 1600 // loss: 0.052\n", "epoch: 96, batch: 1700 // loss: 0.045\n", "epoch: 96, batch: 1800 // loss: 0.053\n", "epoch: 96, batch: 1900 // loss: 0.045\n", "epoch: 96, batch: 2000 // loss: 0.047\n", "epoch: 96, batch: 2100 // loss: 0.046\n", "epoch: 96, batch: 2200 // loss: 0.050\n", "epoch: 96, batch: 2300 // loss: 0.049\n", "epoch: 96, batch: 2400 // loss: 0.042\n", "epoch: 96, batch: 2500 // loss: 0.042\n", "epoch: 96, batch: 2600 // loss: 0.045\n", "epoch: 96, batch: 2700 // loss: 0.042\n", "epoch: 96, batch: 2800 // loss: 0.046\n", "epoch: 96, batch: 2900 // loss: 0.042\n", "epoch: 96, batch: 3000 // loss: 0.045\n", "epoch: 96, batch: 3100 // loss: 0.043\n", "epoch: 96, batch: 3200 // loss: 0.039\n", "epoch: 96, batch: 3300 // loss: 0.038\n", "epoch: 96, batch: 3400 // loss: 0.044\n", "epoch: 96, batch: 3500 // loss: 0.035\n", "epoch: 96, batch: 3600 // loss: 0.043\n", "epoch: 96, batch: 3700 // loss: 0.043\n", "\n", "epoch: 97, batch: 0 // loss: 0.053\n", "epoch: 97, batch: 100 // loss: 0.046\n", "epoch: 97, batch: 200 // loss: 0.043\n", "epoch: 97, batch: 300 // loss: 0.049\n", "epoch: 97, batch: 400 // loss: 0.046\n", "epoch: 97, batch: 500 // loss: 0.040\n", "epoch: 97, batch: 600 // loss: 0.040\n", "epoch: 97, batch: 700 // loss: 0.044\n", "epoch: 97, batch: 800 // loss: 0.042\n", "epoch: 97, batch: 900 // loss: 0.049\n", "epoch: 97, batch: 1000 // loss: 0.046\n", "epoch: 97, batch: 1100 // loss: 0.042\n", "epoch: 97, batch: 1200 // loss: 0.044\n", "epoch: 97, batch: 1300 // loss: 0.046\n", "epoch: 97, batch: 1400 // loss: 0.043\n", "epoch: 97, batch: 1500 // loss: 0.048\n", "epoch: 97, batch: 1600 // loss: 0.052\n", "epoch: 97, batch: 1700 // loss: 0.045\n", "epoch: 97, batch: 1800 // loss: 0.053\n", "epoch: 97, batch: 1900 // loss: 0.045\n", "epoch: 97, batch: 2000 // loss: 0.047\n", "epoch: 97, batch: 2100 // loss: 0.046\n", "epoch: 97, batch: 2200 // loss: 0.050\n", "epoch: 97, batch: 2300 // loss: 0.049\n", "epoch: 97, batch: 2400 // loss: 0.042\n", "epoch: 97, batch: 2500 // loss: 0.042\n", "epoch: 97, batch: 2600 // loss: 0.045\n", "epoch: 97, batch: 2700 // loss: 0.042\n", "epoch: 97, batch: 2800 // loss: 0.046\n", "epoch: 97, batch: 2900 // loss: 0.042\n", "epoch: 97, batch: 3000 // loss: 0.045\n", "epoch: 97, batch: 3100 // loss: 0.043\n", "epoch: 97, batch: 3200 // loss: 0.039\n", "epoch: 97, batch: 3300 // loss: 0.038\n", "epoch: 97, batch: 3400 // loss: 0.044\n", "epoch: 97, batch: 3500 // loss: 0.035\n", "epoch: 97, batch: 3600 // loss: 0.043\n", "epoch: 97, batch: 3700 // loss: 0.043\n", "\n", "epoch: 98, batch: 0 // loss: 0.053\n", "epoch: 98, batch: 100 // loss: 0.046\n", "epoch: 98, batch: 200 // loss: 0.043\n", "epoch: 98, batch: 300 // loss: 0.049\n", "epoch: 98, batch: 400 // loss: 0.046\n", "epoch: 98, batch: 500 // loss: 0.040\n", "epoch: 98, batch: 600 // loss: 0.040\n", "epoch: 98, batch: 700 // loss: 0.044\n", "epoch: 98, batch: 800 // loss: 0.042\n", "epoch: 98, batch: 900 // loss: 0.049\n", "epoch: 98, batch: 1000 // loss: 0.046\n", "epoch: 98, batch: 1100 // loss: 0.042\n", "epoch: 98, batch: 1200 // loss: 0.044\n", "epoch: 98, batch: 1300 // loss: 0.046\n", "epoch: 98, batch: 1400 // loss: 0.043\n", "epoch: 98, batch: 1500 // loss: 0.048\n", "epoch: 98, batch: 1600 // loss: 0.052\n", "epoch: 98, batch: 1700 // loss: 0.045\n", "epoch: 98, batch: 1800 // loss: 0.053\n", "epoch: 98, batch: 1900 // loss: 0.045\n", "epoch: 98, batch: 2000 // loss: 0.047\n", "epoch: 98, batch: 2100 // loss: 0.046\n", "epoch: 98, batch: 2200 // loss: 0.050\n", "epoch: 98, batch: 2300 // loss: 0.049\n", "epoch: 98, batch: 2400 // loss: 0.042\n", "epoch: 98, batch: 2500 // loss: 0.042\n", "epoch: 98, batch: 2600 // loss: 0.045\n", "epoch: 98, batch: 2700 // loss: 0.042\n", "epoch: 98, batch: 2800 // loss: 0.046\n", "epoch: 98, batch: 2900 // loss: 0.042\n", "epoch: 98, batch: 3000 // loss: 0.045\n", "epoch: 98, batch: 3100 // loss: 0.043\n", "epoch: 98, batch: 3200 // loss: 0.039\n", "epoch: 98, batch: 3300 // loss: 0.038\n", "epoch: 98, batch: 3400 // loss: 0.044\n", "epoch: 98, batch: 3500 // loss: 0.035\n", "epoch: 98, batch: 3600 // loss: 0.043\n", "epoch: 98, batch: 3700 // loss: 0.043\n", "\n", "epoch: 99, batch: 0 // loss: 0.053\n", "epoch: 99, batch: 100 // loss: 0.046\n", "epoch: 99, batch: 200 // loss: 0.043\n", "epoch: 99, batch: 300 // loss: 0.049\n", "epoch: 99, batch: 400 // loss: 0.046\n", "epoch: 99, batch: 500 // loss: 0.040\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 99, batch: 600 // loss: 0.040\n", "epoch: 99, batch: 700 // loss: 0.044\n", "epoch: 99, batch: 800 // loss: 0.042\n", "epoch: 99, batch: 900 // loss: 0.049\n", "epoch: 99, batch: 1000 // loss: 0.046\n", "epoch: 99, batch: 1100 // loss: 0.042\n", "epoch: 99, batch: 1200 // loss: 0.044\n", "epoch: 99, batch: 1300 // loss: 0.046\n", "epoch: 99, batch: 1400 // loss: 0.043\n", "epoch: 99, batch: 1500 // loss: 0.048\n", "epoch: 99, batch: 1600 // loss: 0.052\n", "epoch: 99, batch: 1700 // loss: 0.045\n", "epoch: 99, batch: 1800 // loss: 0.053\n", "epoch: 99, batch: 1900 // loss: 0.045\n", "epoch: 99, batch: 2000 // loss: 0.047\n", "epoch: 99, batch: 2100 // loss: 0.046\n", "epoch: 99, batch: 2200 // loss: 0.050\n", "epoch: 99, batch: 2300 // loss: 0.049\n", "epoch: 99, batch: 2400 // loss: 0.042\n", "epoch: 99, batch: 2500 // loss: 0.042\n", "epoch: 99, batch: 2600 // loss: 0.045\n", "epoch: 99, batch: 2700 // loss: 0.042\n", "epoch: 99, batch: 2800 // loss: 0.046\n", "epoch: 99, batch: 2900 // loss: 0.042\n", "epoch: 99, batch: 3000 // loss: 0.045\n", "epoch: 99, batch: 3100 // loss: 0.043\n", "epoch: 99, batch: 3200 // loss: 0.039\n", "epoch: 99, batch: 3300 // loss: 0.038\n", "epoch: 99, batch: 3400 // loss: 0.044\n", "epoch: 99, batch: 3500 // loss: 0.035\n", "epoch: 99, batch: 3600 // loss: 0.043\n", "epoch: 99, batch: 3700 // loss: 0.043\n", "\n", "epoch: 100, batch: 0 // loss: 0.053\n", "epoch: 100, batch: 100 // loss: 0.046\n", "epoch: 100, batch: 200 // loss: 0.043\n", "epoch: 100, batch: 300 // loss: 0.049\n", "epoch: 100, batch: 400 // loss: 0.046\n", "epoch: 100, batch: 500 // loss: 0.040\n", "epoch: 100, batch: 600 // loss: 0.040\n", "epoch: 100, batch: 700 // loss: 0.044\n", "epoch: 100, batch: 800 // loss: 0.042\n", "epoch: 100, batch: 900 // loss: 0.049\n", "epoch: 100, batch: 1000 // loss: 0.046\n", "epoch: 100, batch: 1100 // loss: 0.042\n", "epoch: 100, batch: 1200 // loss: 0.044\n", "epoch: 100, batch: 1300 // loss: 0.046\n", "epoch: 100, batch: 1400 // loss: 0.043\n", "epoch: 100, batch: 1500 // loss: 0.048\n", "epoch: 100, batch: 1600 // loss: 0.052\n", "epoch: 100, batch: 1700 // loss: 0.045\n", "epoch: 100, batch: 1800 // loss: 0.053\n", "epoch: 100, batch: 1900 // loss: 0.045\n", "epoch: 100, batch: 2000 // loss: 0.047\n", "epoch: 100, batch: 2100 // loss: 0.046\n", "epoch: 100, batch: 2200 // loss: 0.050\n", "epoch: 100, batch: 2300 // loss: 0.049\n", "epoch: 100, batch: 2400 // loss: 0.042\n", "epoch: 100, batch: 2500 // loss: 0.042\n", "epoch: 100, batch: 2600 // loss: 0.045\n", "epoch: 100, batch: 2700 // loss: 0.042\n", "epoch: 100, batch: 2800 // loss: 0.046\n", "epoch: 100, batch: 2900 // loss: 0.042\n", "epoch: 100, batch: 3000 // loss: 0.045\n", "epoch: 100, batch: 3100 // loss: 0.043\n", "epoch: 100, batch: 3200 // loss: 0.039\n", "epoch: 100, batch: 3300 // loss: 0.038\n", "epoch: 100, batch: 3400 // loss: 0.044\n", "epoch: 100, batch: 3500 // loss: 0.035\n", "epoch: 100, batch: 3600 // loss: 0.043\n", "epoch: 100, batch: 3700 // loss: 0.043\n", "\n", "epoch: 101, batch: 0 // loss: 0.053\n", "epoch: 101, batch: 100 // loss: 0.046\n", "epoch: 101, batch: 200 // loss: 0.043\n", "epoch: 101, batch: 300 // loss: 0.049\n", "epoch: 101, batch: 400 // loss: 0.046\n", "epoch: 101, batch: 500 // loss: 0.040\n", "epoch: 101, batch: 600 // loss: 0.040\n", "epoch: 101, batch: 700 // loss: 0.044\n", "epoch: 101, batch: 800 // loss: 0.042\n", "epoch: 101, batch: 900 // loss: 0.049\n", "epoch: 101, batch: 1000 // loss: 0.046\n", "epoch: 101, batch: 1100 // loss: 0.042\n", "epoch: 101, batch: 1200 // loss: 0.044\n", "epoch: 101, batch: 1300 // loss: 0.046\n", "epoch: 101, batch: 1400 // loss: 0.043\n", "epoch: 101, batch: 1500 // loss: 0.048\n", "epoch: 101, batch: 1600 // loss: 0.052\n", "epoch: 101, batch: 1700 // loss: 0.045\n", "epoch: 101, batch: 1800 // loss: 0.053\n", "epoch: 101, batch: 1900 // loss: 0.045\n", "epoch: 101, batch: 2000 // loss: 0.047\n", "epoch: 101, batch: 2100 // loss: 0.046\n", "epoch: 101, batch: 2200 // loss: 0.050\n", "epoch: 101, batch: 2300 // loss: 0.049\n", "epoch: 101, batch: 2400 // loss: 0.042\n", "epoch: 101, batch: 2500 // loss: 0.042\n", "epoch: 101, batch: 2600 // loss: 0.045\n", "epoch: 101, batch: 2700 // loss: 0.042\n", "epoch: 101, batch: 2800 // loss: 0.046\n", "epoch: 101, batch: 2900 // loss: 0.042\n", "epoch: 101, batch: 3000 // loss: 0.045\n", "epoch: 101, batch: 3100 // loss: 0.043\n", "epoch: 101, batch: 3200 // loss: 0.039\n", "epoch: 101, batch: 3300 // loss: 0.038\n", "epoch: 101, batch: 3400 // loss: 0.044\n", "epoch: 101, batch: 3500 // loss: 0.035\n", "epoch: 101, batch: 3600 // loss: 0.043\n", "epoch: 101, batch: 3700 // loss: 0.043\n", "\n", "epoch: 102, batch: 0 // loss: 0.053\n", "epoch: 102, batch: 100 // loss: 0.046\n", "epoch: 102, batch: 200 // loss: 0.043\n", "epoch: 102, batch: 300 // loss: 0.049\n", "epoch: 102, batch: 400 // loss: 0.046\n", "epoch: 102, batch: 500 // loss: 0.040\n", "epoch: 102, batch: 600 // loss: 0.040\n", "epoch: 102, batch: 700 // loss: 0.044\n", "epoch: 102, batch: 800 // loss: 0.042\n", "epoch: 102, batch: 900 // loss: 0.049\n", "epoch: 102, batch: 1000 // loss: 0.046\n", "epoch: 102, batch: 1100 // loss: 0.042\n", "epoch: 102, batch: 1200 // loss: 0.044\n", "epoch: 102, batch: 1300 // loss: 0.046\n", "epoch: 102, batch: 1400 // loss: 0.043\n", "epoch: 102, batch: 1500 // loss: 0.048\n", "epoch: 102, batch: 1600 // loss: 0.052\n", "epoch: 102, batch: 1700 // loss: 0.045\n", "epoch: 102, batch: 1800 // loss: 0.053\n", "epoch: 102, batch: 1900 // loss: 0.045\n", "epoch: 102, batch: 2000 // loss: 0.047\n", "epoch: 102, batch: 2100 // loss: 0.046\n", "epoch: 102, batch: 2200 // loss: 0.050\n", "epoch: 102, batch: 2300 // loss: 0.049\n", "epoch: 102, batch: 2400 // loss: 0.042\n", "epoch: 102, batch: 2500 // loss: 0.042\n", "epoch: 102, batch: 2600 // loss: 0.045\n", "epoch: 102, batch: 2700 // loss: 0.042\n", "epoch: 102, batch: 2800 // loss: 0.046\n", "epoch: 102, batch: 2900 // loss: 0.042\n", "epoch: 102, batch: 3000 // loss: 0.045\n", "epoch: 102, batch: 3100 // loss: 0.043\n", "epoch: 102, batch: 3200 // loss: 0.039\n", "epoch: 102, batch: 3300 // loss: 0.038\n", "epoch: 102, batch: 3400 // loss: 0.044\n", "epoch: 102, batch: 3500 // loss: 0.035\n", "epoch: 102, batch: 3600 // loss: 0.043\n", "epoch: 102, batch: 3700 // loss: 0.043\n", "\n", "epoch: 103, batch: 0 // loss: 0.053\n", "epoch: 103, batch: 100 // loss: 0.046\n", "epoch: 103, batch: 200 // loss: 0.043\n", "epoch: 103, batch: 300 // loss: 0.049\n", "epoch: 103, batch: 400 // loss: 0.046\n", "epoch: 103, batch: 500 // loss: 0.040\n", "epoch: 103, batch: 600 // loss: 0.040\n", "epoch: 103, batch: 700 // loss: 0.044\n", "epoch: 103, batch: 800 // loss: 0.042\n", "epoch: 103, batch: 900 // loss: 0.049\n", "epoch: 103, batch: 1000 // loss: 0.046\n", "epoch: 103, batch: 1100 // loss: 0.042\n", "epoch: 103, batch: 1200 // loss: 0.044\n", "epoch: 103, batch: 1300 // loss: 0.046\n", "epoch: 103, batch: 1400 // loss: 0.043\n", "epoch: 103, batch: 1500 // loss: 0.048\n", "epoch: 103, batch: 1600 // loss: 0.052\n", "epoch: 103, batch: 1700 // loss: 0.045\n", "epoch: 103, batch: 1800 // loss: 0.053\n", "epoch: 103, batch: 1900 // loss: 0.045\n", "epoch: 103, batch: 2000 // loss: 0.047\n", "epoch: 103, batch: 2100 // loss: 0.046\n", "epoch: 103, batch: 2200 // loss: 0.050\n", "epoch: 103, batch: 2300 // loss: 0.049\n", "epoch: 103, batch: 2400 // loss: 0.042\n", "epoch: 103, batch: 2500 // loss: 0.042\n", "epoch: 103, batch: 2600 // loss: 0.045\n", "epoch: 103, batch: 2700 // loss: 0.042\n", "epoch: 103, batch: 2800 // loss: 0.046\n", "epoch: 103, batch: 2900 // loss: 0.042\n", "epoch: 103, batch: 3000 // loss: 0.045\n", "epoch: 103, batch: 3100 // loss: 0.043\n", "epoch: 103, batch: 3200 // loss: 0.039\n", "epoch: 103, batch: 3300 // loss: 0.038\n", "epoch: 103, batch: 3400 // loss: 0.044\n", "epoch: 103, batch: 3500 // loss: 0.035\n", "epoch: 103, batch: 3600 // loss: 0.043\n", "epoch: 103, batch: 3700 // loss: 0.043\n", "\n", "epoch: 104, batch: 0 // loss: 0.053\n", "epoch: 104, batch: 100 // loss: 0.046\n", "epoch: 104, batch: 200 // loss: 0.043\n", "epoch: 104, batch: 300 // loss: 0.049\n", "epoch: 104, batch: 400 // loss: 0.046\n", "epoch: 104, batch: 500 // loss: 0.040\n", "epoch: 104, batch: 600 // loss: 0.040\n", "epoch: 104, batch: 700 // loss: 0.044\n", "epoch: 104, batch: 800 // loss: 0.042\n", "epoch: 104, batch: 900 // loss: 0.049\n", "epoch: 104, batch: 1000 // loss: 0.046\n", "epoch: 104, batch: 1100 // loss: 0.042\n", "epoch: 104, batch: 1200 // loss: 0.044\n", "epoch: 104, batch: 1300 // loss: 0.046\n", "epoch: 104, batch: 1400 // loss: 0.043\n", "epoch: 104, batch: 1500 // loss: 0.048\n", "epoch: 104, batch: 1600 // loss: 0.052\n", "epoch: 104, batch: 1700 // loss: 0.045\n", "epoch: 104, batch: 1800 // loss: 0.053\n", "epoch: 104, batch: 1900 // loss: 0.045\n", "epoch: 104, batch: 2000 // loss: 0.047\n", "epoch: 104, batch: 2100 // loss: 0.046\n", "epoch: 104, batch: 2200 // loss: 0.050\n", "epoch: 104, batch: 2300 // loss: 0.049\n", "epoch: 104, batch: 2400 // loss: 0.042\n", "epoch: 104, batch: 2500 // loss: 0.042\n", "epoch: 104, batch: 2600 // loss: 0.045\n", "epoch: 104, batch: 2700 // loss: 0.042\n", "epoch: 104, batch: 2800 // loss: 0.046\n", "epoch: 104, batch: 2900 // loss: 0.042\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 104, batch: 3000 // loss: 0.045\n", "epoch: 104, batch: 3100 // loss: 0.043\n", "epoch: 104, batch: 3200 // loss: 0.039\n", "epoch: 104, batch: 3300 // loss: 0.038\n", "epoch: 104, batch: 3400 // loss: 0.044\n", "epoch: 104, batch: 3500 // loss: 0.035\n", "epoch: 104, batch: 3600 // loss: 0.043\n", "epoch: 104, batch: 3700 // loss: 0.043\n", "\n", "epoch: 105, batch: 0 // loss: 0.053\n", "epoch: 105, batch: 100 // loss: 0.046\n", "epoch: 105, batch: 200 // loss: 0.043\n", "epoch: 105, batch: 300 // loss: 0.049\n", "epoch: 105, batch: 400 // loss: 0.046\n", "epoch: 105, batch: 500 // loss: 0.040\n", "epoch: 105, batch: 600 // loss: 0.040\n", "epoch: 105, batch: 700 // loss: 0.044\n", "epoch: 105, batch: 800 // loss: 0.042\n", "epoch: 105, batch: 900 // loss: 0.049\n", "epoch: 105, batch: 1000 // loss: 0.046\n", "epoch: 105, batch: 1100 // loss: 0.042\n", "epoch: 105, batch: 1200 // loss: 0.044\n", "epoch: 105, batch: 1300 // loss: 0.046\n", "epoch: 105, batch: 1400 // loss: 0.043\n", "epoch: 105, batch: 1500 // loss: 0.048\n", "epoch: 105, batch: 1600 // loss: 0.052\n", "epoch: 105, batch: 1700 // loss: 0.045\n", "epoch: 105, batch: 1800 // loss: 0.053\n", "epoch: 105, batch: 1900 // loss: 0.045\n", "epoch: 105, batch: 2000 // loss: 0.047\n", "epoch: 105, batch: 2100 // loss: 0.046\n", "epoch: 105, batch: 2200 // loss: 0.050\n", "epoch: 105, batch: 2300 // loss: 0.049\n", "epoch: 105, batch: 2400 // loss: 0.042\n", "epoch: 105, batch: 2500 // loss: 0.042\n", "epoch: 105, batch: 2600 // loss: 0.045\n", "epoch: 105, batch: 2700 // loss: 0.042\n", "epoch: 105, batch: 2800 // loss: 0.046\n", "epoch: 105, batch: 2900 // loss: 0.042\n", "epoch: 105, batch: 3000 // loss: 0.045\n", "epoch: 105, batch: 3100 // loss: 0.043\n", "epoch: 105, batch: 3200 // loss: 0.039\n", "epoch: 105, batch: 3300 // loss: 0.038\n", "epoch: 105, batch: 3400 // loss: 0.044\n", "epoch: 105, batch: 3500 // loss: 0.035\n", "epoch: 105, batch: 3600 // loss: 0.043\n", "epoch: 105, batch: 3700 // loss: 0.043\n", "\n", "epoch: 106, batch: 0 // loss: 0.053\n", "epoch: 106, batch: 100 // loss: 0.046\n", "epoch: 106, batch: 200 // loss: 0.043\n", "epoch: 106, batch: 300 // loss: 0.049\n", "epoch: 106, batch: 400 // loss: 0.046\n", "epoch: 106, batch: 500 // loss: 0.040\n", "epoch: 106, batch: 600 // loss: 0.040\n", "epoch: 106, batch: 700 // loss: 0.044\n", "epoch: 106, batch: 800 // loss: 0.042\n", "epoch: 106, batch: 900 // loss: 0.049\n", "epoch: 106, batch: 1000 // loss: 0.046\n", "epoch: 106, batch: 1100 // loss: 0.042\n", "epoch: 106, batch: 1200 // loss: 0.044\n", "epoch: 106, batch: 1300 // loss: 0.046\n", "epoch: 106, batch: 1400 // loss: 0.043\n", "epoch: 106, batch: 1500 // loss: 0.048\n", "epoch: 106, batch: 1600 // loss: 0.052\n", "epoch: 106, batch: 1700 // loss: 0.045\n", "epoch: 106, batch: 1800 // loss: 0.053\n", "epoch: 106, batch: 1900 // loss: 0.045\n", "epoch: 106, batch: 2000 // loss: 0.047\n", "epoch: 106, batch: 2100 // loss: 0.046\n", "epoch: 106, batch: 2200 // loss: 0.050\n", "epoch: 106, batch: 2300 // loss: 0.049\n", "epoch: 106, batch: 2400 // loss: 0.042\n", "epoch: 106, batch: 2500 // loss: 0.042\n", "epoch: 106, batch: 2600 // loss: 0.045\n", "epoch: 106, batch: 2700 // loss: 0.042\n", "epoch: 106, batch: 2800 // loss: 0.046\n", "epoch: 106, batch: 2900 // loss: 0.042\n", "epoch: 106, batch: 3000 // loss: 0.045\n", "epoch: 106, batch: 3100 // loss: 0.043\n", "epoch: 106, batch: 3200 // loss: 0.039\n", "epoch: 106, batch: 3300 // loss: 0.038\n", "epoch: 106, batch: 3400 // loss: 0.044\n", "epoch: 106, batch: 3500 // loss: 0.035\n", "epoch: 106, batch: 3600 // loss: 0.043\n", "epoch: 106, batch: 3700 // loss: 0.043\n", "\n", "epoch: 107, batch: 0 // loss: 0.053\n", "epoch: 107, batch: 100 // loss: 0.046\n", "epoch: 107, batch: 200 // loss: 0.043\n", "epoch: 107, batch: 300 // loss: 0.049\n", "epoch: 107, batch: 400 // loss: 0.046\n", "epoch: 107, batch: 500 // loss: 0.040\n", "epoch: 107, batch: 600 // loss: 0.040\n", "epoch: 107, batch: 700 // loss: 0.044\n", "epoch: 107, batch: 800 // loss: 0.042\n", "epoch: 107, batch: 900 // loss: 0.049\n", "epoch: 107, batch: 1000 // loss: 0.046\n", "epoch: 107, batch: 1100 // loss: 0.042\n", "epoch: 107, batch: 1200 // loss: 0.044\n", "epoch: 107, batch: 1300 // loss: 0.046\n", "epoch: 107, batch: 1400 // loss: 0.043\n", "epoch: 107, batch: 1500 // loss: 0.048\n", "epoch: 107, batch: 1600 // loss: 0.052\n", "epoch: 107, batch: 1700 // loss: 0.045\n", "epoch: 107, batch: 1800 // loss: 0.053\n", "epoch: 107, batch: 1900 // loss: 0.045\n", "epoch: 107, batch: 2000 // loss: 0.047\n", "epoch: 107, batch: 2100 // loss: 0.046\n", "epoch: 107, batch: 2200 // loss: 0.050\n", "epoch: 107, batch: 2300 // loss: 0.049\n", "epoch: 107, batch: 2400 // loss: 0.042\n", "epoch: 107, batch: 2500 // loss: 0.042\n", "epoch: 107, batch: 2600 // loss: 0.045\n", "epoch: 107, batch: 2700 // loss: 0.042\n", "epoch: 107, batch: 2800 // loss: 0.046\n", "epoch: 107, batch: 2900 // loss: 0.042\n", "epoch: 107, batch: 3000 // loss: 0.045\n", "epoch: 107, batch: 3100 // loss: 0.043\n", "epoch: 107, batch: 3200 // loss: 0.039\n", "epoch: 107, batch: 3300 // loss: 0.038\n", "epoch: 107, batch: 3400 // loss: 0.044\n", "epoch: 107, batch: 3500 // loss: 0.035\n", "epoch: 107, batch: 3600 // loss: 0.043\n", "epoch: 107, batch: 3700 // loss: 0.043\n", "\n", "epoch: 108, batch: 0 // loss: 0.053\n", "epoch: 108, batch: 100 // loss: 0.046\n", "epoch: 108, batch: 200 // loss: 0.043\n", "epoch: 108, batch: 300 // loss: 0.049\n", "epoch: 108, batch: 400 // loss: 0.046\n", "epoch: 108, batch: 500 // loss: 0.040\n", "epoch: 108, batch: 600 // loss: 0.040\n", "epoch: 108, batch: 700 // loss: 0.044\n", "epoch: 108, batch: 800 // loss: 0.042\n", "epoch: 108, batch: 900 // loss: 0.049\n", "epoch: 108, batch: 1000 // loss: 0.046\n", "epoch: 108, batch: 1100 // loss: 0.042\n", "epoch: 108, batch: 1200 // loss: 0.044\n", "epoch: 108, batch: 1300 // loss: 0.046\n", "epoch: 108, batch: 1400 // loss: 0.043\n", "epoch: 108, batch: 1500 // loss: 0.048\n", "epoch: 108, batch: 1600 // loss: 0.052\n", "epoch: 108, batch: 1700 // loss: 0.045\n", "epoch: 108, batch: 1800 // loss: 0.053\n", "epoch: 108, batch: 1900 // loss: 0.045\n", "epoch: 108, batch: 2000 // loss: 0.047\n", "epoch: 108, batch: 2100 // loss: 0.046\n", "epoch: 108, batch: 2200 // loss: 0.050\n", "epoch: 108, batch: 2300 // loss: 0.049\n", "epoch: 108, batch: 2400 // loss: 0.042\n", "epoch: 108, batch: 2500 // loss: 0.042\n", "epoch: 108, batch: 2600 // loss: 0.045\n", "epoch: 108, batch: 2700 // loss: 0.042\n", "epoch: 108, batch: 2800 // loss: 0.046\n", "epoch: 108, batch: 2900 // loss: 0.042\n", "epoch: 108, batch: 3000 // loss: 0.045\n", "epoch: 108, batch: 3100 // loss: 0.043\n", "epoch: 108, batch: 3200 // loss: 0.039\n", "epoch: 108, batch: 3300 // loss: 0.038\n", "epoch: 108, batch: 3400 // loss: 0.044\n", "epoch: 108, batch: 3500 // loss: 0.035\n", "epoch: 108, batch: 3600 // loss: 0.043\n", "epoch: 108, batch: 3700 // loss: 0.043\n", "\n", "epoch: 109, batch: 0 // loss: 0.053\n", "epoch: 109, batch: 100 // loss: 0.046\n", "epoch: 109, batch: 200 // loss: 0.043\n", "epoch: 109, batch: 300 // loss: 0.049\n", "epoch: 109, batch: 400 // loss: 0.046\n", "epoch: 109, batch: 500 // loss: 0.040\n", "epoch: 109, batch: 600 // loss: 0.040\n", "epoch: 109, batch: 700 // loss: 0.044\n", "epoch: 109, batch: 800 // loss: 0.042\n", "epoch: 109, batch: 900 // loss: 0.049\n", "epoch: 109, batch: 1000 // loss: 0.046\n", "epoch: 109, batch: 1100 // loss: 0.042\n", "epoch: 109, batch: 1200 // loss: 0.044\n", "epoch: 109, batch: 1300 // loss: 0.046\n", "epoch: 109, batch: 1400 // loss: 0.043\n", "epoch: 109, batch: 1500 // loss: 0.048\n", "epoch: 109, batch: 1600 // loss: 0.052\n", "epoch: 109, batch: 1700 // loss: 0.045\n", "epoch: 109, batch: 1800 // loss: 0.053\n", "epoch: 109, batch: 1900 // loss: 0.045\n", "epoch: 109, batch: 2000 // loss: 0.047\n", "epoch: 109, batch: 2100 // loss: 0.046\n", "epoch: 109, batch: 2200 // loss: 0.050\n", "epoch: 109, batch: 2300 // loss: 0.049\n", "epoch: 109, batch: 2400 // loss: 0.042\n", "epoch: 109, batch: 2500 // loss: 0.042\n", "epoch: 109, batch: 2600 // loss: 0.045\n", "epoch: 109, batch: 2700 // loss: 0.042\n", "epoch: 109, batch: 2800 // loss: 0.046\n", "epoch: 109, batch: 2900 // loss: 0.042\n", "epoch: 109, batch: 3000 // loss: 0.045\n", "epoch: 109, batch: 3100 // loss: 0.043\n", "epoch: 109, batch: 3200 // loss: 0.039\n", "epoch: 109, batch: 3300 // loss: 0.038\n", "epoch: 109, batch: 3400 // loss: 0.044\n", "epoch: 109, batch: 3500 // loss: 0.035\n", "epoch: 109, batch: 3600 // loss: 0.043\n", "epoch: 109, batch: 3700 // loss: 0.043\n", "\n", "epoch: 110, batch: 0 // loss: 0.053\n", "epoch: 110, batch: 100 // loss: 0.046\n", "epoch: 110, batch: 200 // loss: 0.043\n", "epoch: 110, batch: 300 // loss: 0.049\n", "epoch: 110, batch: 400 // loss: 0.046\n", "epoch: 110, batch: 500 // loss: 0.040\n", "epoch: 110, batch: 600 // loss: 0.040\n", "epoch: 110, batch: 700 // loss: 0.044\n", "epoch: 110, batch: 800 // loss: 0.042\n", "epoch: 110, batch: 900 // loss: 0.049\n", "epoch: 110, batch: 1000 // loss: 0.046\n", "epoch: 110, batch: 1100 // loss: 0.042\n", "epoch: 110, batch: 1200 // loss: 0.044\n", "epoch: 110, batch: 1300 // loss: 0.046\n", "epoch: 110, batch: 1400 // loss: 0.043\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 110, batch: 1500 // loss: 0.048\n", "epoch: 110, batch: 1600 // loss: 0.052\n", "epoch: 110, batch: 1700 // loss: 0.045\n", "epoch: 110, batch: 1800 // loss: 0.053\n", "epoch: 110, batch: 1900 // loss: 0.045\n", "epoch: 110, batch: 2000 // loss: 0.047\n", "epoch: 110, batch: 2100 // loss: 0.046\n", "epoch: 110, batch: 2200 // loss: 0.050\n", "epoch: 110, batch: 2300 // loss: 0.049\n", "epoch: 110, batch: 2400 // loss: 0.042\n", "epoch: 110, batch: 2500 // loss: 0.042\n", "epoch: 110, batch: 2600 // loss: 0.045\n", "epoch: 110, batch: 2700 // loss: 0.042\n", "epoch: 110, batch: 2800 // loss: 0.046\n", "epoch: 110, batch: 2900 // loss: 0.042\n", "epoch: 110, batch: 3000 // loss: 0.045\n", "epoch: 110, batch: 3100 // loss: 0.043\n", "epoch: 110, batch: 3200 // loss: 0.039\n", "epoch: 110, batch: 3300 // loss: 0.038\n", "epoch: 110, batch: 3400 // loss: 0.044\n", "epoch: 110, batch: 3500 // loss: 0.035\n", "epoch: 110, batch: 3600 // loss: 0.043\n", "epoch: 110, batch: 3700 // loss: 0.043\n", "\n", "epoch: 111, batch: 0 // loss: 0.053\n", "epoch: 111, batch: 100 // loss: 0.046\n", "epoch: 111, batch: 200 // loss: 0.043\n", "epoch: 111, batch: 300 // loss: 0.049\n", "epoch: 111, batch: 400 // loss: 0.046\n", "epoch: 111, batch: 500 // loss: 0.040\n", "epoch: 111, batch: 600 // loss: 0.040\n", "epoch: 111, batch: 700 // loss: 0.044\n", "epoch: 111, batch: 800 // loss: 0.042\n", "epoch: 111, batch: 900 // loss: 0.049\n", "epoch: 111, batch: 1000 // loss: 0.046\n", "epoch: 111, batch: 1100 // loss: 0.042\n", "epoch: 111, batch: 1200 // loss: 0.044\n", "epoch: 111, batch: 1300 // loss: 0.046\n", "epoch: 111, batch: 1400 // loss: 0.043\n", "epoch: 111, batch: 1500 // loss: 0.048\n", "epoch: 111, batch: 1600 // loss: 0.052\n", "epoch: 111, batch: 1700 // loss: 0.045\n", "epoch: 111, batch: 1800 // loss: 0.053\n", "epoch: 111, batch: 1900 // loss: 0.045\n", "epoch: 111, batch: 2000 // loss: 0.047\n", "epoch: 111, batch: 2100 // loss: 0.046\n", "epoch: 111, batch: 2200 // loss: 0.050\n", "epoch: 111, batch: 2300 // loss: 0.049\n", "epoch: 111, batch: 2400 // loss: 0.042\n", "epoch: 111, batch: 2500 // loss: 0.042\n", "epoch: 111, batch: 2600 // loss: 0.045\n", "epoch: 111, batch: 2700 // loss: 0.042\n", "epoch: 111, batch: 2800 // loss: 0.046\n", "epoch: 111, batch: 2900 // loss: 0.042\n", "epoch: 111, batch: 3000 // loss: 0.045\n", "epoch: 111, batch: 3100 // loss: 0.043\n", "epoch: 111, batch: 3200 // loss: 0.039\n", "epoch: 111, batch: 3300 // loss: 0.038\n", "epoch: 111, batch: 3400 // loss: 0.044\n", "epoch: 111, batch: 3500 // loss: 0.035\n", "epoch: 111, batch: 3600 // loss: 0.043\n", "epoch: 111, batch: 3700 // loss: 0.043\n", "\n", "epoch: 112, batch: 0 // loss: 0.053\n", "epoch: 112, batch: 100 // loss: 0.046\n", "epoch: 112, batch: 200 // loss: 0.043\n", "epoch: 112, batch: 300 // loss: 0.049\n", "epoch: 112, batch: 400 // loss: 0.046\n", "epoch: 112, batch: 500 // loss: 0.040\n", "epoch: 112, batch: 600 // loss: 0.040\n", "epoch: 112, batch: 700 // loss: 0.044\n", "epoch: 112, batch: 800 // loss: 0.042\n", "epoch: 112, batch: 900 // loss: 0.049\n", "epoch: 112, batch: 1000 // loss: 0.046\n", "epoch: 112, batch: 1100 // loss: 0.042\n", "epoch: 112, batch: 1200 // loss: 0.044\n", "epoch: 112, batch: 1300 // loss: 0.046\n", "epoch: 112, batch: 1400 // loss: 0.043\n", "epoch: 112, batch: 1500 // loss: 0.048\n", "epoch: 112, batch: 1600 // loss: 0.052\n", "epoch: 112, batch: 1700 // loss: 0.045\n", "epoch: 112, batch: 1800 // loss: 0.053\n", "epoch: 112, batch: 1900 // loss: 0.045\n", "epoch: 112, batch: 2000 // loss: 0.047\n", "epoch: 112, batch: 2100 // loss: 0.046\n", "epoch: 112, batch: 2200 // loss: 0.050\n", "epoch: 112, batch: 2300 // loss: 0.049\n", "epoch: 112, batch: 2400 // loss: 0.042\n", "epoch: 112, batch: 2500 // loss: 0.042\n", "epoch: 112, batch: 2600 // loss: 0.045\n", "epoch: 112, batch: 2700 // loss: 0.042\n", "epoch: 112, batch: 2800 // loss: 0.046\n", "epoch: 112, batch: 2900 // loss: 0.042\n", "epoch: 112, batch: 3000 // loss: 0.045\n", "epoch: 112, batch: 3100 // loss: 0.043\n", "epoch: 112, batch: 3200 // loss: 0.039\n", "epoch: 112, batch: 3300 // loss: 0.038\n", "epoch: 112, batch: 3400 // loss: 0.044\n", "epoch: 112, batch: 3500 // loss: 0.035\n", "epoch: 112, batch: 3600 // loss: 0.043\n", "epoch: 112, batch: 3700 // loss: 0.043\n", "\n", "epoch: 113, batch: 0 // loss: 0.053\n", "epoch: 113, batch: 100 // loss: 0.046\n", "epoch: 113, batch: 200 // loss: 0.043\n", "epoch: 113, batch: 300 // loss: 0.049\n", "epoch: 113, batch: 400 // loss: 0.046\n", "epoch: 113, batch: 500 // loss: 0.040\n", "epoch: 113, batch: 600 // loss: 0.040\n", "epoch: 113, batch: 700 // loss: 0.044\n", "epoch: 113, batch: 800 // loss: 0.042\n", "epoch: 113, batch: 900 // loss: 0.049\n", "epoch: 113, batch: 1000 // loss: 0.046\n", "epoch: 113, batch: 1100 // loss: 0.042\n", "epoch: 113, batch: 1200 // loss: 0.044\n", "epoch: 113, batch: 1300 // loss: 0.046\n", "epoch: 113, batch: 1400 // loss: 0.043\n", "epoch: 113, batch: 1500 // loss: 0.048\n", "epoch: 113, batch: 1600 // loss: 0.052\n", "epoch: 113, batch: 1700 // loss: 0.045\n", "epoch: 113, batch: 1800 // loss: 0.053\n", "epoch: 113, batch: 1900 // loss: 0.045\n", "epoch: 113, batch: 2000 // loss: 0.047\n", "epoch: 113, batch: 2100 // loss: 0.046\n", "epoch: 113, batch: 2200 // loss: 0.050\n", "epoch: 113, batch: 2300 // loss: 0.049\n", "epoch: 113, batch: 2400 // loss: 0.042\n", "epoch: 113, batch: 2500 // loss: 0.042\n", "epoch: 113, batch: 2600 // loss: 0.045\n", "epoch: 113, batch: 2700 // loss: 0.042\n", "epoch: 113, batch: 2800 // loss: 0.046\n", "epoch: 113, batch: 2900 // loss: 0.042\n", "epoch: 113, batch: 3000 // loss: 0.045\n", "epoch: 113, batch: 3100 // loss: 0.043\n", "epoch: 113, batch: 3200 // loss: 0.039\n", "epoch: 113, batch: 3300 // loss: 0.038\n", "epoch: 113, batch: 3400 // loss: 0.044\n", "epoch: 113, batch: 3500 // loss: 0.035\n", "epoch: 113, batch: 3600 // loss: 0.043\n", "epoch: 113, batch: 3700 // loss: 0.043\n", "\n", "epoch: 114, batch: 0 // loss: 0.053\n", "epoch: 114, batch: 100 // loss: 0.046\n", "epoch: 114, batch: 200 // loss: 0.043\n", "epoch: 114, batch: 300 // loss: 0.049\n", "epoch: 114, batch: 400 // loss: 0.046\n", "epoch: 114, batch: 500 // loss: 0.040\n", "epoch: 114, batch: 600 // loss: 0.040\n", "epoch: 114, batch: 700 // loss: 0.044\n", "epoch: 114, batch: 800 // loss: 0.042\n", "epoch: 114, batch: 900 // loss: 0.049\n", "epoch: 114, batch: 1000 // loss: 0.046\n", "epoch: 114, batch: 1100 // loss: 0.042\n", "epoch: 114, batch: 1200 // loss: 0.044\n", "epoch: 114, batch: 1300 // loss: 0.046\n", "epoch: 114, batch: 1400 // loss: 0.043\n", "epoch: 114, batch: 1500 // loss: 0.048\n", "epoch: 114, batch: 1600 // loss: 0.052\n", "epoch: 114, batch: 1700 // loss: 0.045\n", "epoch: 114, batch: 1800 // loss: 0.053\n", "epoch: 114, batch: 1900 // loss: 0.045\n", "epoch: 114, batch: 2000 // loss: 0.047\n", "epoch: 114, batch: 2100 // loss: 0.046\n", "epoch: 114, batch: 2200 // loss: 0.050\n", "epoch: 114, batch: 2300 // loss: 0.049\n", "epoch: 114, batch: 2400 // loss: 0.042\n", "epoch: 114, batch: 2500 // loss: 0.042\n", "epoch: 114, batch: 2600 // loss: 0.045\n", "epoch: 114, batch: 2700 // loss: 0.042\n", "epoch: 114, batch: 2800 // loss: 0.046\n", "epoch: 114, batch: 2900 // loss: 0.042\n", "epoch: 114, batch: 3000 // loss: 0.045\n", "epoch: 114, batch: 3100 // loss: 0.043\n", "epoch: 114, batch: 3200 // loss: 0.039\n", "epoch: 114, batch: 3300 // loss: 0.038\n", "epoch: 114, batch: 3400 // loss: 0.044\n", "epoch: 114, batch: 3500 // loss: 0.035\n", "epoch: 114, batch: 3600 // loss: 0.043\n", "epoch: 114, batch: 3700 // loss: 0.043\n", "\n", "epoch: 115, batch: 0 // loss: 0.053\n", "epoch: 115, batch: 100 // loss: 0.046\n", "epoch: 115, batch: 200 // loss: 0.043\n", "epoch: 115, batch: 300 // loss: 0.049\n", "epoch: 115, batch: 400 // loss: 0.046\n", "epoch: 115, batch: 500 // loss: 0.040\n", "epoch: 115, batch: 600 // loss: 0.040\n", "epoch: 115, batch: 700 // loss: 0.044\n", "epoch: 115, batch: 800 // loss: 0.042\n", "epoch: 115, batch: 900 // loss: 0.049\n", "epoch: 115, batch: 1000 // loss: 0.046\n", "epoch: 115, batch: 1100 // loss: 0.042\n", "epoch: 115, batch: 1200 // loss: 0.044\n", "epoch: 115, batch: 1300 // loss: 0.046\n", "epoch: 115, batch: 1400 // loss: 0.043\n", "epoch: 115, batch: 1500 // loss: 0.048\n", "epoch: 115, batch: 1600 // loss: 0.052\n", "epoch: 115, batch: 1700 // loss: 0.045\n", "epoch: 115, batch: 1800 // loss: 0.053\n", "epoch: 115, batch: 1900 // loss: 0.045\n", "epoch: 115, batch: 2000 // loss: 0.047\n", "epoch: 115, batch: 2100 // loss: 0.046\n", "epoch: 115, batch: 2200 // loss: 0.050\n", "epoch: 115, batch: 2300 // loss: 0.049\n", "epoch: 115, batch: 2400 // loss: 0.042\n", "epoch: 115, batch: 2500 // loss: 0.042\n", "epoch: 115, batch: 2600 // loss: 0.045\n", "epoch: 115, batch: 2700 // loss: 0.042\n", "epoch: 115, batch: 2800 // loss: 0.046\n", "epoch: 115, batch: 2900 // loss: 0.042\n", "epoch: 115, batch: 3000 // loss: 0.045\n", "epoch: 115, batch: 3100 // loss: 0.043\n", "epoch: 115, batch: 3200 // loss: 0.039\n", "epoch: 115, batch: 3300 // loss: 0.038\n", "epoch: 115, batch: 3400 // loss: 0.044\n", "epoch: 115, batch: 3500 // loss: 0.035\n", "epoch: 115, batch: 3600 // loss: 0.043\n", "epoch: 115, batch: 3700 // loss: 0.043\n", "\n", "epoch: 116, batch: 0 // loss: 0.053\n", "epoch: 116, batch: 100 // loss: 0.046\n", "epoch: 116, batch: 200 // loss: 0.043\n", "epoch: 116, batch: 300 // loss: 0.049\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 116, batch: 400 // loss: 0.046\n", "epoch: 116, batch: 500 // loss: 0.040\n", "epoch: 116, batch: 600 // loss: 0.040\n", "epoch: 116, batch: 700 // loss: 0.044\n", "epoch: 116, batch: 800 // loss: 0.042\n", "epoch: 116, batch: 900 // loss: 0.049\n", "epoch: 116, batch: 1000 // loss: 0.046\n", "epoch: 116, batch: 1100 // loss: 0.042\n", "epoch: 116, batch: 1200 // loss: 0.044\n", "epoch: 116, batch: 1300 // loss: 0.046\n", "epoch: 116, batch: 1400 // loss: 0.043\n", "epoch: 116, batch: 1500 // loss: 0.048\n", "epoch: 116, batch: 1600 // loss: 0.052\n", "epoch: 116, batch: 1700 // loss: 0.045\n", "epoch: 116, batch: 1800 // loss: 0.053\n", "epoch: 116, batch: 1900 // loss: 0.045\n", "epoch: 116, batch: 2000 // loss: 0.047\n", "epoch: 116, batch: 2100 // loss: 0.046\n", "epoch: 116, batch: 2200 // loss: 0.050\n", "epoch: 116, batch: 2300 // loss: 0.049\n", "epoch: 116, batch: 2400 // loss: 0.042\n", "epoch: 116, batch: 2500 // loss: 0.042\n", "epoch: 116, batch: 2600 // loss: 0.045\n", "epoch: 116, batch: 2700 // loss: 0.042\n", "epoch: 116, batch: 2800 // loss: 0.046\n", "epoch: 116, batch: 2900 // loss: 0.042\n", "epoch: 116, batch: 3000 // loss: 0.045\n", "epoch: 116, batch: 3100 // loss: 0.043\n", "epoch: 116, batch: 3200 // loss: 0.039\n", "epoch: 116, batch: 3300 // loss: 0.038\n", "epoch: 116, batch: 3400 // loss: 0.044\n", "epoch: 116, batch: 3500 // loss: 0.035\n", "epoch: 116, batch: 3600 // loss: 0.043\n", "epoch: 116, batch: 3700 // loss: 0.043\n", "\n", "epoch: 117, batch: 0 // loss: 0.053\n", "epoch: 117, batch: 100 // loss: 0.046\n", "epoch: 117, batch: 200 // loss: 0.043\n", "epoch: 117, batch: 300 // loss: 0.049\n", "epoch: 117, batch: 400 // loss: 0.046\n", "epoch: 117, batch: 500 // loss: 0.040\n", "epoch: 117, batch: 600 // loss: 0.040\n", "epoch: 117, batch: 700 // loss: 0.044\n", "epoch: 117, batch: 800 // loss: 0.042\n", "epoch: 117, batch: 900 // loss: 0.049\n", "epoch: 117, batch: 1000 // loss: 0.046\n", "epoch: 117, batch: 1100 // loss: 0.042\n", "epoch: 117, batch: 1200 // loss: 0.044\n", "epoch: 117, batch: 1300 // loss: 0.046\n", "epoch: 117, batch: 1400 // loss: 0.043\n", "epoch: 117, batch: 1500 // loss: 0.048\n", "epoch: 117, batch: 1600 // loss: 0.052\n", "epoch: 117, batch: 1700 // loss: 0.045\n", "epoch: 117, batch: 1800 // loss: 0.053\n", "epoch: 117, batch: 1900 // loss: 0.045\n", "epoch: 117, batch: 2000 // loss: 0.047\n", "epoch: 117, batch: 2100 // loss: 0.046\n", "epoch: 117, batch: 2200 // loss: 0.050\n", "epoch: 117, batch: 2300 // loss: 0.049\n", "epoch: 117, batch: 2400 // loss: 0.042\n", "epoch: 117, batch: 2500 // loss: 0.042\n", "epoch: 117, batch: 2600 // loss: 0.045\n", "epoch: 117, batch: 2700 // loss: 0.042\n", "epoch: 117, batch: 2800 // loss: 0.046\n", "epoch: 117, batch: 2900 // loss: 0.042\n", "epoch: 117, batch: 3000 // loss: 0.045\n", "epoch: 117, batch: 3100 // loss: 0.043\n", "epoch: 117, batch: 3200 // loss: 0.039\n", "epoch: 117, batch: 3300 // loss: 0.038\n", "epoch: 117, batch: 3400 // loss: 0.044\n", "epoch: 117, batch: 3500 // loss: 0.035\n", "epoch: 117, batch: 3600 // loss: 0.043\n", "epoch: 117, batch: 3700 // loss: 0.043\n", "\n", "epoch: 118, batch: 0 // loss: 0.053\n", "epoch: 118, batch: 100 // loss: 0.046\n", "epoch: 118, batch: 200 // loss: 0.043\n", "epoch: 118, batch: 300 // loss: 0.049\n", "epoch: 118, batch: 400 // loss: 0.046\n", "epoch: 118, batch: 500 // loss: 0.040\n", "epoch: 118, batch: 600 // loss: 0.040\n", "epoch: 118, batch: 700 // loss: 0.044\n", "epoch: 118, batch: 800 // loss: 0.042\n", "epoch: 118, batch: 900 // loss: 0.049\n", "epoch: 118, batch: 1000 // loss: 0.046\n", "epoch: 118, batch: 1100 // loss: 0.042\n", "epoch: 118, batch: 1200 // loss: 0.044\n", "epoch: 118, batch: 1300 // loss: 0.046\n", "epoch: 118, batch: 1400 // loss: 0.043\n", "epoch: 118, batch: 1500 // loss: 0.048\n", "epoch: 118, batch: 1600 // loss: 0.052\n", "epoch: 118, batch: 1700 // loss: 0.045\n", "epoch: 118, batch: 1800 // loss: 0.053\n", "epoch: 118, batch: 1900 // loss: 0.045\n", "epoch: 118, batch: 2000 // loss: 0.047\n", "epoch: 118, batch: 2100 // loss: 0.046\n", "epoch: 118, batch: 2200 // loss: 0.050\n", "epoch: 118, batch: 2300 // loss: 0.049\n", "epoch: 118, batch: 2400 // loss: 0.042\n", "epoch: 118, batch: 2500 // loss: 0.042\n", "epoch: 118, batch: 2600 // loss: 0.045\n", "epoch: 118, batch: 2700 // loss: 0.042\n", "epoch: 118, batch: 2800 // loss: 0.046\n", "epoch: 118, batch: 2900 // loss: 0.042\n", "epoch: 118, batch: 3000 // loss: 0.045\n", "epoch: 118, batch: 3100 // loss: 0.043\n", "epoch: 118, batch: 3200 // loss: 0.039\n", "epoch: 118, batch: 3300 // loss: 0.038\n", "epoch: 118, batch: 3400 // loss: 0.044\n", "epoch: 118, batch: 3500 // loss: 0.035\n", "epoch: 118, batch: 3600 // loss: 0.043\n", "epoch: 118, batch: 3700 // loss: 0.043\n", "\n", "epoch: 119, batch: 0 // loss: 0.053\n", "epoch: 119, batch: 100 // loss: 0.046\n", "epoch: 119, batch: 200 // loss: 0.043\n", "epoch: 119, batch: 300 // loss: 0.049\n", "epoch: 119, batch: 400 // loss: 0.046\n", "epoch: 119, batch: 500 // loss: 0.040\n", "epoch: 119, batch: 600 // loss: 0.040\n", "epoch: 119, batch: 700 // loss: 0.044\n", "epoch: 119, batch: 800 // loss: 0.042\n", "epoch: 119, batch: 900 // loss: 0.049\n", "epoch: 119, batch: 1000 // loss: 0.046\n", "epoch: 119, batch: 1100 // loss: 0.042\n", "epoch: 119, batch: 1200 // loss: 0.044\n", "epoch: 119, batch: 1300 // loss: 0.046\n", "epoch: 119, batch: 1400 // loss: 0.043\n", "epoch: 119, batch: 1500 // loss: 0.048\n", "epoch: 119, batch: 1600 // loss: 0.052\n", "epoch: 119, batch: 1700 // loss: 0.045\n", "epoch: 119, batch: 1800 // loss: 0.053\n", "epoch: 119, batch: 1900 // loss: 0.045\n", "epoch: 119, batch: 2000 // loss: 0.047\n", "epoch: 119, batch: 2100 // loss: 0.046\n", "epoch: 119, batch: 2200 // loss: 0.050\n", "epoch: 119, batch: 2300 // loss: 0.049\n", "epoch: 119, batch: 2400 // loss: 0.042\n", "epoch: 119, batch: 2500 // loss: 0.042\n", "epoch: 119, batch: 2600 // loss: 0.045\n", "epoch: 119, batch: 2700 // loss: 0.042\n", "epoch: 119, batch: 2800 // loss: 0.046\n", "epoch: 119, batch: 2900 // loss: 0.042\n", "epoch: 119, batch: 3000 // loss: 0.045\n", "epoch: 119, batch: 3100 // loss: 0.043\n", "epoch: 119, batch: 3200 // loss: 0.039\n", "epoch: 119, batch: 3300 // loss: 0.038\n", "epoch: 119, batch: 3400 // loss: 0.044\n", "epoch: 119, batch: 3500 // loss: 0.035\n", "epoch: 119, batch: 3600 // loss: 0.043\n", "epoch: 119, batch: 3700 // loss: 0.043\n", "\n", "epoch: 120, batch: 0 // loss: 0.053\n", "epoch: 120, batch: 100 // loss: 0.046\n", "epoch: 120, batch: 200 // loss: 0.043\n", "epoch: 120, batch: 300 // loss: 0.049\n", "epoch: 120, batch: 400 // loss: 0.046\n", "epoch: 120, batch: 500 // loss: 0.040\n", "epoch: 120, batch: 600 // loss: 0.040\n", "epoch: 120, batch: 700 // loss: 0.044\n", "epoch: 120, batch: 800 // loss: 0.042\n", "epoch: 120, batch: 900 // loss: 0.049\n", "epoch: 120, batch: 1000 // loss: 0.046\n", "epoch: 120, batch: 1100 // loss: 0.042\n", "epoch: 120, batch: 1200 // loss: 0.044\n", "epoch: 120, batch: 1300 // loss: 0.046\n", "epoch: 120, batch: 1400 // loss: 0.043\n", "epoch: 120, batch: 1500 // loss: 0.048\n", "epoch: 120, batch: 1600 // loss: 0.052\n", "epoch: 120, batch: 1700 // loss: 0.045\n", "epoch: 120, batch: 1800 // loss: 0.053\n", "epoch: 120, batch: 1900 // loss: 0.045\n", "epoch: 120, batch: 2000 // loss: 0.047\n", "epoch: 120, batch: 2100 // loss: 0.046\n", "epoch: 120, batch: 2200 // loss: 0.050\n", "epoch: 120, batch: 2300 // loss: 0.049\n", "epoch: 120, batch: 2400 // loss: 0.042\n", "epoch: 120, batch: 2500 // loss: 0.042\n", "epoch: 120, batch: 2600 // loss: 0.045\n", "epoch: 120, batch: 2700 // loss: 0.042\n", "epoch: 120, batch: 2800 // loss: 0.046\n", "epoch: 120, batch: 2900 // loss: 0.042\n", "epoch: 120, batch: 3000 // loss: 0.045\n", "epoch: 120, batch: 3100 // loss: 0.043\n", "epoch: 120, batch: 3200 // loss: 0.039\n", "epoch: 120, batch: 3300 // loss: 0.038\n", "epoch: 120, batch: 3400 // loss: 0.044\n", "epoch: 120, batch: 3500 // loss: 0.035\n", "epoch: 120, batch: 3600 // loss: 0.043\n", "epoch: 120, batch: 3700 // loss: 0.043\n", "\n", "epoch: 121, batch: 0 // loss: 0.053\n", "epoch: 121, batch: 100 // loss: 0.046\n", "epoch: 121, batch: 200 // loss: 0.043\n", "epoch: 121, batch: 300 // loss: 0.049\n", "epoch: 121, batch: 400 // loss: 0.046\n", "epoch: 121, batch: 500 // loss: 0.040\n", "epoch: 121, batch: 600 // loss: 0.040\n", "epoch: 121, batch: 700 // loss: 0.044\n", "epoch: 121, batch: 800 // loss: 0.042\n", "epoch: 121, batch: 900 // loss: 0.049\n", "epoch: 121, batch: 1000 // loss: 0.046\n", "epoch: 121, batch: 1100 // loss: 0.042\n", "epoch: 121, batch: 1200 // loss: 0.044\n", "epoch: 121, batch: 1300 // loss: 0.046\n", "epoch: 121, batch: 1400 // loss: 0.043\n", "epoch: 121, batch: 1500 // loss: 0.048\n", "epoch: 121, batch: 1600 // loss: 0.052\n", "epoch: 121, batch: 1700 // loss: 0.045\n", "epoch: 121, batch: 1800 // loss: 0.053\n", "epoch: 121, batch: 1900 // loss: 0.045\n", "epoch: 121, batch: 2000 // loss: 0.047\n", "epoch: 121, batch: 2100 // loss: 0.046\n", "epoch: 121, batch: 2200 // loss: 0.050\n", "epoch: 121, batch: 2300 // loss: 0.049\n", "epoch: 121, batch: 2400 // loss: 0.042\n", "epoch: 121, batch: 2500 // loss: 0.042\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 121, batch: 2600 // loss: 0.045\n", "epoch: 121, batch: 2700 // loss: 0.042\n", "epoch: 121, batch: 2800 // loss: 0.046\n", "epoch: 121, batch: 2900 // loss: 0.042\n", "epoch: 121, batch: 3000 // loss: 0.045\n", "epoch: 121, batch: 3100 // loss: 0.043\n", "epoch: 121, batch: 3200 // loss: 0.039\n", "epoch: 121, batch: 3300 // loss: 0.038\n", "epoch: 121, batch: 3400 // loss: 0.044\n", "epoch: 121, batch: 3500 // loss: 0.035\n", "epoch: 121, batch: 3600 // loss: 0.043\n", "epoch: 121, batch: 3700 // loss: 0.043\n", "\n", "epoch: 122, batch: 0 // loss: 0.053\n", "epoch: 122, batch: 100 // loss: 0.046\n", "epoch: 122, batch: 200 // loss: 0.043\n", "epoch: 122, batch: 300 // loss: 0.049\n", "epoch: 122, batch: 400 // loss: 0.046\n", "epoch: 122, batch: 500 // loss: 0.040\n", "epoch: 122, batch: 600 // loss: 0.040\n", "epoch: 122, batch: 700 // loss: 0.044\n", "epoch: 122, batch: 800 // loss: 0.042\n", "epoch: 122, batch: 900 // loss: 0.049\n", "epoch: 122, batch: 1000 // loss: 0.046\n", "epoch: 122, batch: 1100 // loss: 0.042\n", "epoch: 122, batch: 1200 // loss: 0.044\n", "epoch: 122, batch: 1300 // loss: 0.046\n", "epoch: 122, batch: 1400 // loss: 0.043\n", "epoch: 122, batch: 1500 // loss: 0.048\n", "epoch: 122, batch: 1600 // loss: 0.052\n", "epoch: 122, batch: 1700 // loss: 0.045\n", "epoch: 122, batch: 1800 // loss: 0.053\n", "epoch: 122, batch: 1900 // loss: 0.045\n", "epoch: 122, batch: 2000 // loss: 0.047\n", "epoch: 122, batch: 2100 // loss: 0.046\n", "epoch: 122, batch: 2200 // loss: 0.050\n", "epoch: 122, batch: 2300 // loss: 0.049\n", "epoch: 122, batch: 2400 // loss: 0.042\n", "epoch: 122, batch: 2500 // loss: 0.042\n", "epoch: 122, batch: 2600 // loss: 0.045\n", "epoch: 122, batch: 2700 // loss: 0.042\n", "epoch: 122, batch: 2800 // loss: 0.046\n", "epoch: 122, batch: 2900 // loss: 0.042\n", "epoch: 122, batch: 3000 // loss: 0.045\n", "epoch: 122, batch: 3100 // loss: 0.043\n", "epoch: 122, batch: 3200 // loss: 0.039\n", "epoch: 122, batch: 3300 // loss: 0.038\n", "epoch: 122, batch: 3400 // loss: 0.044\n", "epoch: 122, batch: 3500 // loss: 0.035\n", "epoch: 122, batch: 3600 // loss: 0.043\n", "epoch: 122, batch: 3700 // loss: 0.043\n", "\n", "epoch: 123, batch: 0 // loss: 0.053\n", "epoch: 123, batch: 100 // loss: 0.046\n", "epoch: 123, batch: 200 // loss: 0.043\n", "epoch: 123, batch: 300 // loss: 0.049\n", "epoch: 123, batch: 400 // loss: 0.046\n", "epoch: 123, batch: 500 // loss: 0.040\n", "epoch: 123, batch: 600 // loss: 0.040\n", "epoch: 123, batch: 700 // loss: 0.044\n", "epoch: 123, batch: 800 // loss: 0.042\n", "epoch: 123, batch: 900 // loss: 0.049\n", "epoch: 123, batch: 1000 // loss: 0.046\n", "epoch: 123, batch: 1100 // loss: 0.042\n", "epoch: 123, batch: 1200 // loss: 0.044\n", "epoch: 123, batch: 1300 // loss: 0.046\n", "epoch: 123, batch: 1400 // loss: 0.043\n", "epoch: 123, batch: 1500 // loss: 0.048\n", "epoch: 123, batch: 1600 // loss: 0.052\n", "epoch: 123, batch: 1700 // loss: 0.045\n", "epoch: 123, batch: 1800 // loss: 0.053\n", "epoch: 123, batch: 1900 // loss: 0.045\n", "epoch: 123, batch: 2000 // loss: 0.047\n", "epoch: 123, batch: 2100 // loss: 0.046\n", "epoch: 123, batch: 2200 // loss: 0.050\n", "epoch: 123, batch: 2300 // loss: 0.049\n", "epoch: 123, batch: 2400 // loss: 0.042\n", "epoch: 123, batch: 2500 // loss: 0.042\n", "epoch: 123, batch: 2600 // loss: 0.045\n", "epoch: 123, batch: 2700 // loss: 0.042\n", "epoch: 123, batch: 2800 // loss: 0.046\n", "epoch: 123, batch: 2900 // loss: 0.042\n", "epoch: 123, batch: 3000 // loss: 0.045\n", "epoch: 123, batch: 3100 // loss: 0.043\n", "epoch: 123, batch: 3200 // loss: 0.039\n", "epoch: 123, batch: 3300 // loss: 0.038\n", "epoch: 123, batch: 3400 // loss: 0.044\n", "epoch: 123, batch: 3500 // loss: 0.035\n", "epoch: 123, batch: 3600 // loss: 0.043\n", "epoch: 123, batch: 3700 // loss: 0.043\n", "\n", "epoch: 124, batch: 0 // loss: 0.053\n", "epoch: 124, batch: 100 // loss: 0.046\n", "epoch: 124, batch: 200 // loss: 0.043\n", "epoch: 124, batch: 300 // loss: 0.049\n", "epoch: 124, batch: 400 // loss: 0.046\n", "epoch: 124, batch: 500 // loss: 0.040\n", "epoch: 124, batch: 600 // loss: 0.040\n", "epoch: 124, batch: 700 // loss: 0.044\n", "epoch: 124, batch: 800 // loss: 0.042\n", "epoch: 124, batch: 900 // loss: 0.049\n", "epoch: 124, batch: 1000 // loss: 0.046\n", "epoch: 124, batch: 1100 // loss: 0.042\n", "epoch: 124, batch: 1200 // loss: 0.044\n", "epoch: 124, batch: 1300 // loss: 0.046\n", "epoch: 124, batch: 1400 // loss: 0.043\n", "epoch: 124, batch: 1500 // loss: 0.048\n", "epoch: 124, batch: 1600 // loss: 0.052\n", "epoch: 124, batch: 1700 // loss: 0.045\n", "epoch: 124, batch: 1800 // loss: 0.053\n", "epoch: 124, batch: 1900 // loss: 0.045\n", "epoch: 124, batch: 2000 // loss: 0.047\n", "epoch: 124, batch: 2100 // loss: 0.046\n", "epoch: 124, batch: 2200 // loss: 0.050\n", "epoch: 124, batch: 2300 // loss: 0.049\n", "epoch: 124, batch: 2400 // loss: 0.042\n", "epoch: 124, batch: 2500 // loss: 0.042\n", "epoch: 124, batch: 2600 // loss: 0.045\n", "epoch: 124, batch: 2700 // loss: 0.042\n", "epoch: 124, batch: 2800 // loss: 0.046\n", "epoch: 124, batch: 2900 // loss: 0.042\n", "epoch: 124, batch: 3000 // loss: 0.045\n", "epoch: 124, batch: 3100 // loss: 0.043\n", "epoch: 124, batch: 3200 // loss: 0.039\n", "epoch: 124, batch: 3300 // loss: 0.038\n", "epoch: 124, batch: 3400 // loss: 0.044\n", "epoch: 124, batch: 3500 // loss: 0.035\n", "epoch: 124, batch: 3600 // loss: 0.043\n", "epoch: 124, batch: 3700 // loss: 0.043\n", "\n", "epoch: 125, batch: 0 // loss: 0.053\n", "epoch: 125, batch: 100 // loss: 0.046\n", "epoch: 125, batch: 200 // loss: 0.043\n", "epoch: 125, batch: 300 // loss: 0.049\n", "epoch: 125, batch: 400 // loss: 0.046\n", "epoch: 125, batch: 500 // loss: 0.040\n", "epoch: 125, batch: 600 // loss: 0.040\n", "epoch: 125, batch: 700 // loss: 0.044\n", "epoch: 125, batch: 800 // loss: 0.042\n", "epoch: 125, batch: 900 // loss: 0.049\n", "epoch: 125, batch: 1000 // loss: 0.046\n", "epoch: 125, batch: 1100 // loss: 0.042\n", "epoch: 125, batch: 1200 // loss: 0.044\n", "epoch: 125, batch: 1300 // loss: 0.046\n", "epoch: 125, batch: 1400 // loss: 0.043\n", "epoch: 125, batch: 1500 // loss: 0.048\n", "epoch: 125, batch: 1600 // loss: 0.052\n", "epoch: 125, batch: 1700 // loss: 0.045\n", "epoch: 125, batch: 1800 // loss: 0.053\n", "epoch: 125, batch: 1900 // loss: 0.045\n", "epoch: 125, batch: 2000 // loss: 0.047\n", "epoch: 125, batch: 2100 // loss: 0.046\n", "epoch: 125, batch: 2200 // loss: 0.050\n", "epoch: 125, batch: 2300 // loss: 0.049\n", "epoch: 125, batch: 2400 // loss: 0.042\n", "epoch: 125, batch: 2500 // loss: 0.042\n", "epoch: 125, batch: 2600 // loss: 0.045\n", "epoch: 125, batch: 2700 // loss: 0.042\n", "epoch: 125, batch: 2800 // loss: 0.046\n", "epoch: 125, batch: 2900 // loss: 0.042\n", "epoch: 125, batch: 3000 // loss: 0.045\n", "epoch: 125, batch: 3100 // loss: 0.043\n", "epoch: 125, batch: 3200 // loss: 0.039\n", "epoch: 125, batch: 3300 // loss: 0.038\n", "epoch: 125, batch: 3400 // loss: 0.044\n", "epoch: 125, batch: 3500 // loss: 0.035\n", "epoch: 125, batch: 3600 // loss: 0.043\n", "epoch: 125, batch: 3700 // loss: 0.043\n", "\n", "epoch: 126, batch: 0 // loss: 0.053\n", "epoch: 126, batch: 100 // loss: 0.046\n", "epoch: 126, batch: 200 // loss: 0.043\n", "epoch: 126, batch: 300 // loss: 0.049\n", "epoch: 126, batch: 400 // loss: 0.046\n", "epoch: 126, batch: 500 // loss: 0.040\n", "epoch: 126, batch: 600 // loss: 0.040\n", "epoch: 126, batch: 700 // loss: 0.044\n", "epoch: 126, batch: 800 // loss: 0.042\n", "epoch: 126, batch: 900 // loss: 0.049\n", "epoch: 126, batch: 1000 // loss: 0.046\n", "epoch: 126, batch: 1100 // loss: 0.042\n", "epoch: 126, batch: 1200 // loss: 0.044\n", "epoch: 126, batch: 1300 // loss: 0.046\n", "epoch: 126, batch: 1400 // loss: 0.043\n", "epoch: 126, batch: 1500 // loss: 0.048\n", "epoch: 126, batch: 1600 // loss: 0.052\n", "epoch: 126, batch: 1700 // loss: 0.045\n", "epoch: 126, batch: 1800 // loss: 0.053\n", "epoch: 126, batch: 1900 // loss: 0.045\n", "epoch: 126, batch: 2000 // loss: 0.047\n", "epoch: 126, batch: 2100 // loss: 0.046\n", "epoch: 126, batch: 2200 // loss: 0.050\n", "epoch: 126, batch: 2300 // loss: 0.049\n", "epoch: 126, batch: 2400 // loss: 0.042\n", "epoch: 126, batch: 2500 // loss: 0.042\n", "epoch: 126, batch: 2600 // loss: 0.045\n", "epoch: 126, batch: 2700 // loss: 0.042\n", "epoch: 126, batch: 2800 // loss: 0.046\n", "epoch: 126, batch: 2900 // loss: 0.042\n", "epoch: 126, batch: 3000 // loss: 0.045\n", "epoch: 126, batch: 3100 // loss: 0.043\n", "epoch: 126, batch: 3200 // loss: 0.039\n", "epoch: 126, batch: 3300 // loss: 0.038\n", "epoch: 126, batch: 3400 // loss: 0.044\n", "epoch: 126, batch: 3500 // loss: 0.035\n", "epoch: 126, batch: 3600 // loss: 0.043\n", "epoch: 126, batch: 3700 // loss: 0.043\n", "\n", "epoch: 127, batch: 0 // loss: 0.053\n", "epoch: 127, batch: 100 // loss: 0.046\n", "epoch: 127, batch: 200 // loss: 0.043\n", "epoch: 127, batch: 300 // loss: 0.049\n", "epoch: 127, batch: 400 // loss: 0.046\n", "epoch: 127, batch: 500 // loss: 0.040\n", "epoch: 127, batch: 600 // loss: 0.040\n", "epoch: 127, batch: 700 // loss: 0.044\n", "epoch: 127, batch: 800 // loss: 0.042\n", "epoch: 127, batch: 900 // loss: 0.049\n", "epoch: 127, batch: 1000 // loss: 0.046\n", "epoch: 127, batch: 1100 // loss: 0.042\n", "epoch: 127, batch: 1200 // loss: 0.044\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 127, batch: 1300 // loss: 0.046\n", "epoch: 127, batch: 1400 // loss: 0.043\n", "epoch: 127, batch: 1500 // loss: 0.048\n", "epoch: 127, batch: 1600 // loss: 0.052\n", "epoch: 127, batch: 1700 // loss: 0.045\n", "epoch: 127, batch: 1800 // loss: 0.053\n", "epoch: 127, batch: 1900 // loss: 0.045\n", "epoch: 127, batch: 2000 // loss: 0.047\n", "epoch: 127, batch: 2100 // loss: 0.046\n", "epoch: 127, batch: 2200 // loss: 0.050\n", "epoch: 127, batch: 2300 // loss: 0.049\n", "epoch: 127, batch: 2400 // loss: 0.042\n", "epoch: 127, batch: 2500 // loss: 0.042\n", "epoch: 127, batch: 2600 // loss: 0.045\n", "epoch: 127, batch: 2700 // loss: 0.042\n", "epoch: 127, batch: 2800 // loss: 0.046\n", "epoch: 127, batch: 2900 // loss: 0.042\n", "epoch: 127, batch: 3000 // loss: 0.045\n", "epoch: 127, batch: 3100 // loss: 0.043\n", "epoch: 127, batch: 3200 // loss: 0.039\n", "epoch: 127, batch: 3300 // loss: 0.038\n", "epoch: 127, batch: 3400 // loss: 0.044\n", "epoch: 127, batch: 3500 // loss: 0.035\n", "epoch: 127, batch: 3600 // loss: 0.043\n", "epoch: 127, batch: 3700 // loss: 0.043\n", "\n", "epoch: 128, batch: 0 // loss: 0.053\n", "epoch: 128, batch: 100 // loss: 0.046\n", "epoch: 128, batch: 200 // loss: 0.043\n", "epoch: 128, batch: 300 // loss: 0.049\n", "epoch: 128, batch: 400 // loss: 0.046\n", "epoch: 128, batch: 500 // loss: 0.040\n", "epoch: 128, batch: 600 // loss: 0.040\n", "epoch: 128, batch: 700 // loss: 0.044\n", "epoch: 128, batch: 800 // loss: 0.042\n", "epoch: 128, batch: 900 // loss: 0.049\n", "epoch: 128, batch: 1000 // loss: 0.046\n", "epoch: 128, batch: 1100 // loss: 0.042\n", "epoch: 128, batch: 1200 // loss: 0.044\n", "epoch: 128, batch: 1300 // loss: 0.046\n", "epoch: 128, batch: 1400 // loss: 0.043\n", "epoch: 128, batch: 1500 // loss: 0.048\n", "epoch: 128, batch: 1600 // loss: 0.052\n", "epoch: 128, batch: 1700 // loss: 0.045\n", "epoch: 128, batch: 1800 // loss: 0.053\n", "epoch: 128, batch: 1900 // loss: 0.045\n", "epoch: 128, batch: 2000 // loss: 0.047\n", "epoch: 128, batch: 2100 // loss: 0.046\n", "epoch: 128, batch: 2200 // loss: 0.050\n", "epoch: 128, batch: 2300 // loss: 0.049\n", "epoch: 128, batch: 2400 // loss: 0.042\n", "epoch: 128, batch: 2500 // loss: 0.042\n", "epoch: 128, batch: 2600 // loss: 0.045\n", "epoch: 128, batch: 2700 // loss: 0.042\n", "epoch: 128, batch: 2800 // loss: 0.046\n", "epoch: 128, batch: 2900 // loss: 0.042\n", "epoch: 128, batch: 3000 // loss: 0.045\n", "epoch: 128, batch: 3100 // loss: 0.043\n", "epoch: 128, batch: 3200 // loss: 0.039\n", "epoch: 128, batch: 3300 // loss: 0.038\n", "epoch: 128, batch: 3400 // loss: 0.044\n", "epoch: 128, batch: 3500 // loss: 0.035\n", "epoch: 128, batch: 3600 // loss: 0.043\n", "epoch: 128, batch: 3700 // loss: 0.043\n", "\n", "epoch: 129, batch: 0 // loss: 0.053\n", "epoch: 129, batch: 100 // loss: 0.046\n", "epoch: 129, batch: 200 // loss: 0.043\n", "epoch: 129, batch: 300 // loss: 0.049\n", "epoch: 129, batch: 400 // loss: 0.046\n", "epoch: 129, batch: 500 // loss: 0.040\n", "epoch: 129, batch: 600 // loss: 0.040\n", "epoch: 129, batch: 700 // loss: 0.044\n", "epoch: 129, batch: 800 // loss: 0.042\n", "epoch: 129, batch: 900 // loss: 0.049\n", "epoch: 129, batch: 1000 // loss: 0.046\n", "epoch: 129, batch: 1100 // loss: 0.042\n", "epoch: 129, batch: 1200 // loss: 0.044\n", "epoch: 129, batch: 1300 // loss: 0.046\n", "epoch: 129, batch: 1400 // loss: 0.043\n", "epoch: 129, batch: 1500 // loss: 0.048\n", "epoch: 129, batch: 1600 // loss: 0.052\n", "epoch: 129, batch: 1700 // loss: 0.045\n", "epoch: 129, batch: 1800 // loss: 0.053\n", "epoch: 129, batch: 1900 // loss: 0.045\n", "epoch: 129, batch: 2000 // loss: 0.047\n", "epoch: 129, batch: 2100 // loss: 0.046\n", "epoch: 129, batch: 2200 // loss: 0.050\n", "epoch: 129, batch: 2300 // loss: 0.049\n", "epoch: 129, batch: 2400 // loss: 0.042\n", "epoch: 129, batch: 2500 // loss: 0.042\n", "epoch: 129, batch: 2600 // loss: 0.045\n", "epoch: 129, batch: 2700 // loss: 0.042\n", "epoch: 129, batch: 2800 // loss: 0.046\n", "epoch: 129, batch: 2900 // loss: 0.042\n", "epoch: 129, batch: 3000 // loss: 0.045\n", "epoch: 129, batch: 3100 // loss: 0.043\n", "epoch: 129, batch: 3200 // loss: 0.039\n", "epoch: 129, batch: 3300 // loss: 0.038\n", "epoch: 129, batch: 3400 // loss: 0.044\n", "epoch: 129, batch: 3500 // loss: 0.035\n", "epoch: 129, batch: 3600 // loss: 0.043\n", "epoch: 129, batch: 3700 // loss: 0.043\n", "\n", "epoch: 130, batch: 0 // loss: 0.053\n", "epoch: 130, batch: 100 // loss: 0.046\n", "epoch: 130, batch: 200 // loss: 0.043\n", "epoch: 130, batch: 300 // loss: 0.049\n", "epoch: 130, batch: 400 // loss: 0.046\n", "epoch: 130, batch: 500 // loss: 0.040\n", "epoch: 130, batch: 600 // loss: 0.040\n", "epoch: 130, batch: 700 // loss: 0.044\n", "epoch: 130, batch: 800 // loss: 0.042\n", "epoch: 130, batch: 900 // loss: 0.049\n", "epoch: 130, batch: 1000 // loss: 0.046\n", "epoch: 130, batch: 1100 // loss: 0.042\n", "epoch: 130, batch: 1200 // loss: 0.044\n", "epoch: 130, batch: 1300 // loss: 0.046\n", "epoch: 130, batch: 1400 // loss: 0.043\n", "epoch: 130, batch: 1500 // loss: 0.048\n", "epoch: 130, batch: 1600 // loss: 0.052\n", "epoch: 130, batch: 1700 // loss: 0.045\n", "epoch: 130, batch: 1800 // loss: 0.053\n", "epoch: 130, batch: 1900 // loss: 0.045\n", "epoch: 130, batch: 2000 // loss: 0.047\n", "epoch: 130, batch: 2100 // loss: 0.046\n", "epoch: 130, batch: 2200 // loss: 0.050\n", "epoch: 130, batch: 2300 // loss: 0.049\n", "epoch: 130, batch: 2400 // loss: 0.042\n", "epoch: 130, batch: 2500 // loss: 0.042\n", "epoch: 130, batch: 2600 // loss: 0.045\n", "epoch: 130, batch: 2700 // loss: 0.042\n", "epoch: 130, batch: 2800 // loss: 0.046\n", "epoch: 130, batch: 2900 // loss: 0.042\n", "epoch: 130, batch: 3000 // loss: 0.045\n", "epoch: 130, batch: 3100 // loss: 0.043\n", "epoch: 130, batch: 3200 // loss: 0.039\n", "epoch: 130, batch: 3300 // loss: 0.038\n", "epoch: 130, batch: 3400 // loss: 0.044\n", "epoch: 130, batch: 3500 // loss: 0.035\n", "epoch: 130, batch: 3600 // loss: 0.043\n", "epoch: 130, batch: 3700 // loss: 0.043\n", "\n", "epoch: 131, batch: 0 // loss: 0.053\n", "epoch: 131, batch: 100 // loss: 0.046\n", "epoch: 131, batch: 200 // loss: 0.043\n", "epoch: 131, batch: 300 // loss: 0.049\n", "epoch: 131, batch: 400 // loss: 0.046\n", "epoch: 131, batch: 500 // loss: 0.040\n", "epoch: 131, batch: 600 // loss: 0.040\n", "epoch: 131, batch: 700 // loss: 0.044\n", "epoch: 131, batch: 800 // loss: 0.042\n", "epoch: 131, batch: 900 // loss: 0.049\n", "epoch: 131, batch: 1000 // loss: 0.046\n", "epoch: 131, batch: 1100 // loss: 0.042\n", "epoch: 131, batch: 1200 // loss: 0.044\n", "epoch: 131, batch: 1300 // loss: 0.046\n", "epoch: 131, batch: 1400 // loss: 0.043\n", "epoch: 131, batch: 1500 // loss: 0.048\n", "epoch: 131, batch: 1600 // loss: 0.052\n", "epoch: 131, batch: 1700 // loss: 0.045\n", "epoch: 131, batch: 1800 // loss: 0.053\n", "epoch: 131, batch: 1900 // loss: 0.045\n", "epoch: 131, batch: 2000 // loss: 0.047\n", "epoch: 131, batch: 2100 // loss: 0.046\n", "epoch: 131, batch: 2200 // loss: 0.050\n", "epoch: 131, batch: 2300 // loss: 0.049\n", "epoch: 131, batch: 2400 // loss: 0.042\n", "epoch: 131, batch: 2500 // loss: 0.042\n", "epoch: 131, batch: 2600 // loss: 0.045\n", "epoch: 131, batch: 2700 // loss: 0.042\n", "epoch: 131, batch: 2800 // loss: 0.046\n", "epoch: 131, batch: 2900 // loss: 0.042\n", "epoch: 131, batch: 3000 // loss: 0.045\n", "epoch: 131, batch: 3100 // loss: 0.043\n", "epoch: 131, batch: 3200 // loss: 0.039\n", "epoch: 131, batch: 3300 // loss: 0.038\n", "epoch: 131, batch: 3400 // loss: 0.044\n", "epoch: 131, batch: 3500 // loss: 0.035\n", "epoch: 131, batch: 3600 // loss: 0.043\n", "epoch: 131, batch: 3700 // loss: 0.043\n", "\n", "epoch: 132, batch: 0 // loss: 0.053\n", "epoch: 132, batch: 100 // loss: 0.046\n", "epoch: 132, batch: 200 // loss: 0.043\n", "epoch: 132, batch: 300 // loss: 0.049\n", "epoch: 132, batch: 400 // loss: 0.046\n", "epoch: 132, batch: 500 // loss: 0.040\n", "epoch: 132, batch: 600 // loss: 0.040\n", "epoch: 132, batch: 700 // loss: 0.044\n", "epoch: 132, batch: 800 // loss: 0.042\n", "epoch: 132, batch: 900 // loss: 0.049\n", "epoch: 132, batch: 1000 // loss: 0.046\n", "epoch: 132, batch: 1100 // loss: 0.042\n", "epoch: 132, batch: 1200 // loss: 0.044\n", "epoch: 132, batch: 1300 // loss: 0.046\n", "epoch: 132, batch: 1400 // loss: 0.043\n", "epoch: 132, batch: 1500 // loss: 0.048\n", "epoch: 132, batch: 1600 // loss: 0.052\n", "epoch: 132, batch: 1700 // loss: 0.045\n", "epoch: 132, batch: 1800 // loss: 0.053\n", "epoch: 132, batch: 1900 // loss: 0.045\n", "epoch: 132, batch: 2000 // loss: 0.047\n", "epoch: 132, batch: 2100 // loss: 0.046\n", "epoch: 132, batch: 2200 // loss: 0.050\n", "epoch: 132, batch: 2300 // loss: 0.049\n", "epoch: 132, batch: 2400 // loss: 0.042\n", "epoch: 132, batch: 2500 // loss: 0.042\n", "epoch: 132, batch: 2600 // loss: 0.045\n", "epoch: 132, batch: 2700 // loss: 0.042\n", "epoch: 132, batch: 2800 // loss: 0.046\n", "epoch: 132, batch: 2900 // loss: 0.042\n", "epoch: 132, batch: 3000 // loss: 0.045\n", "epoch: 132, batch: 3100 // loss: 0.043\n", "epoch: 132, batch: 3200 // loss: 0.039\n", "epoch: 132, batch: 3300 // loss: 0.038\n", "epoch: 132, batch: 3400 // loss: 0.044\n", "epoch: 132, batch: 3500 // loss: 0.035\n", "epoch: 132, batch: 3600 // loss: 0.043\n", "epoch: 132, batch: 3700 // loss: 0.043\n", "\n", "epoch: 133, batch: 0 // loss: 0.053\n", "epoch: 133, batch: 100 // loss: 0.046\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 133, batch: 200 // loss: 0.043\n", "epoch: 133, batch: 300 // loss: 0.049\n", "epoch: 133, batch: 400 // loss: 0.046\n", "epoch: 133, batch: 500 // loss: 0.040\n", "epoch: 133, batch: 600 // loss: 0.040\n", "epoch: 133, batch: 700 // loss: 0.044\n", "epoch: 133, batch: 800 // loss: 0.042\n", "epoch: 133, batch: 900 // loss: 0.049\n", "epoch: 133, batch: 1000 // loss: 0.046\n", "epoch: 133, batch: 1100 // loss: 0.042\n", "epoch: 133, batch: 1200 // loss: 0.044\n", "epoch: 133, batch: 1300 // loss: 0.046\n", "epoch: 133, batch: 1400 // loss: 0.043\n", "epoch: 133, batch: 1500 // loss: 0.048\n", "epoch: 133, batch: 1600 // loss: 0.052\n", "epoch: 133, batch: 1700 // loss: 0.045\n", "epoch: 133, batch: 1800 // loss: 0.053\n", "epoch: 133, batch: 1900 // loss: 0.045\n", "epoch: 133, batch: 2000 // loss: 0.047\n", "epoch: 133, batch: 2100 // loss: 0.046\n", "epoch: 133, batch: 2200 // loss: 0.050\n", "epoch: 133, batch: 2300 // loss: 0.049\n", "epoch: 133, batch: 2400 // loss: 0.042\n", "epoch: 133, batch: 2500 // loss: 0.042\n", "epoch: 133, batch: 2600 // loss: 0.045\n", "epoch: 133, batch: 2700 // loss: 0.042\n", "epoch: 133, batch: 2800 // loss: 0.046\n", "epoch: 133, batch: 2900 // loss: 0.042\n", "epoch: 133, batch: 3000 // loss: 0.045\n", "epoch: 133, batch: 3100 // loss: 0.043\n", "epoch: 133, batch: 3200 // loss: 0.039\n", "epoch: 133, batch: 3300 // loss: 0.038\n", "epoch: 133, batch: 3400 // loss: 0.044\n", "epoch: 133, batch: 3500 // loss: 0.035\n", "epoch: 133, batch: 3600 // loss: 0.043\n", "epoch: 133, batch: 3700 // loss: 0.043\n", "\n", "epoch: 134, batch: 0 // loss: 0.053\n", "epoch: 134, batch: 100 // loss: 0.046\n", "epoch: 134, batch: 200 // loss: 0.043\n", "epoch: 134, batch: 300 // loss: 0.049\n", "epoch: 134, batch: 400 // loss: 0.046\n", "epoch: 134, batch: 500 // loss: 0.040\n", "epoch: 134, batch: 600 // loss: 0.040\n", "epoch: 134, batch: 700 // loss: 0.044\n", "epoch: 134, batch: 800 // loss: 0.042\n", "epoch: 134, batch: 900 // loss: 0.049\n", "epoch: 134, batch: 1000 // loss: 0.046\n", "epoch: 134, batch: 1100 // loss: 0.042\n", "epoch: 134, batch: 1200 // loss: 0.044\n", "epoch: 134, batch: 1300 // loss: 0.046\n", "epoch: 134, batch: 1400 // loss: 0.043\n", "epoch: 134, batch: 1500 // loss: 0.048\n", "epoch: 134, batch: 1600 // loss: 0.052\n", "epoch: 134, batch: 1700 // loss: 0.045\n", "epoch: 134, batch: 1800 // loss: 0.053\n", "epoch: 134, batch: 1900 // loss: 0.045\n", "epoch: 134, batch: 2000 // loss: 0.047\n", "epoch: 134, batch: 2100 // loss: 0.046\n", "epoch: 134, batch: 2200 // loss: 0.050\n", "epoch: 134, batch: 2300 // loss: 0.049\n", "epoch: 134, batch: 2400 // loss: 0.042\n", "epoch: 134, batch: 2500 // loss: 0.042\n", "epoch: 134, batch: 2600 // loss: 0.045\n", "epoch: 134, batch: 2700 // loss: 0.042\n", "epoch: 134, batch: 2800 // loss: 0.046\n", "epoch: 134, batch: 2900 // loss: 0.042\n", "epoch: 134, batch: 3000 // loss: 0.045\n", "epoch: 134, batch: 3100 // loss: 0.043\n", "epoch: 134, batch: 3200 // loss: 0.039\n", "epoch: 134, batch: 3300 // loss: 0.038\n", "epoch: 134, batch: 3400 // loss: 0.044\n", "epoch: 134, batch: 3500 // loss: 0.035\n", "epoch: 134, batch: 3600 // loss: 0.043\n", "epoch: 134, batch: 3700 // loss: 0.043\n", "\n", "epoch: 135, batch: 0 // loss: 0.053\n", "epoch: 135, batch: 100 // loss: 0.046\n", "epoch: 135, batch: 200 // loss: 0.043\n", "epoch: 135, batch: 300 // loss: 0.049\n", "epoch: 135, batch: 400 // loss: 0.046\n", "epoch: 135, batch: 500 // loss: 0.040\n", "epoch: 135, batch: 600 // loss: 0.040\n", "epoch: 135, batch: 700 // loss: 0.044\n", "epoch: 135, batch: 800 // loss: 0.042\n", "epoch: 135, batch: 900 // loss: 0.049\n", "epoch: 135, batch: 1000 // loss: 0.046\n", "epoch: 135, batch: 1100 // loss: 0.042\n", "epoch: 135, batch: 1200 // loss: 0.044\n", "epoch: 135, batch: 1300 // loss: 0.046\n", "epoch: 135, batch: 1400 // loss: 0.043\n", "epoch: 135, batch: 1500 // loss: 0.048\n", "epoch: 135, batch: 1600 // loss: 0.052\n", "epoch: 135, batch: 1700 // loss: 0.045\n", "epoch: 135, batch: 1800 // loss: 0.053\n", "epoch: 135, batch: 1900 // loss: 0.045\n", "epoch: 135, batch: 2000 // loss: 0.047\n", "epoch: 135, batch: 2100 // loss: 0.046\n", "epoch: 135, batch: 2200 // loss: 0.050\n", "epoch: 135, batch: 2300 // loss: 0.049\n", "epoch: 135, batch: 2400 // loss: 0.042\n", "epoch: 135, batch: 2500 // loss: 0.042\n", "epoch: 135, batch: 2600 // loss: 0.045\n", "epoch: 135, batch: 2700 // loss: 0.042\n", "epoch: 135, batch: 2800 // loss: 0.046\n", "epoch: 135, batch: 2900 // loss: 0.042\n", "epoch: 135, batch: 3000 // loss: 0.045\n", "epoch: 135, batch: 3100 // loss: 0.043\n", "epoch: 135, batch: 3200 // loss: 0.039\n", "epoch: 135, batch: 3300 // loss: 0.038\n", "epoch: 135, batch: 3400 // loss: 0.044\n", "epoch: 135, batch: 3500 // loss: 0.035\n", "epoch: 135, batch: 3600 // loss: 0.043\n", "epoch: 135, batch: 3700 // loss: 0.043\n", "\n", "epoch: 136, batch: 0 // loss: 0.053\n", "epoch: 136, batch: 100 // loss: 0.046\n", "epoch: 136, batch: 200 // loss: 0.043\n", "epoch: 136, batch: 300 // loss: 0.049\n", "epoch: 136, batch: 400 // loss: 0.046\n", "epoch: 136, batch: 500 // loss: 0.040\n", "epoch: 136, batch: 600 // loss: 0.040\n", "epoch: 136, batch: 700 // loss: 0.044\n", "epoch: 136, batch: 800 // loss: 0.042\n", "epoch: 136, batch: 900 // loss: 0.049\n", "epoch: 136, batch: 1000 // loss: 0.046\n", "epoch: 136, batch: 1100 // loss: 0.042\n", "epoch: 136, batch: 1200 // loss: 0.044\n", "epoch: 136, batch: 1300 // loss: 0.046\n", "epoch: 136, batch: 1400 // loss: 0.043\n", "epoch: 136, batch: 1500 // loss: 0.048\n", "epoch: 136, batch: 1600 // loss: 0.052\n", "epoch: 136, batch: 1700 // loss: 0.045\n", "epoch: 136, batch: 1800 // loss: 0.053\n", "epoch: 136, batch: 1900 // loss: 0.045\n", "epoch: 136, batch: 2000 // loss: 0.047\n", "epoch: 136, batch: 2100 // loss: 0.046\n", "epoch: 136, batch: 2200 // loss: 0.050\n", "epoch: 136, batch: 2300 // loss: 0.049\n", "epoch: 136, batch: 2400 // loss: 0.042\n", "epoch: 136, batch: 2500 // loss: 0.042\n", "epoch: 136, batch: 2600 // loss: 0.045\n", "epoch: 136, batch: 2700 // loss: 0.042\n", "epoch: 136, batch: 2800 // loss: 0.046\n", "epoch: 136, batch: 2900 // loss: 0.042\n", "epoch: 136, batch: 3000 // loss: 0.045\n", "epoch: 136, batch: 3100 // loss: 0.043\n", "epoch: 136, batch: 3200 // loss: 0.039\n", "epoch: 136, batch: 3300 // loss: 0.038\n", "epoch: 136, batch: 3400 // loss: 0.044\n", "epoch: 136, batch: 3500 // loss: 0.035\n", "epoch: 136, batch: 3600 // loss: 0.043\n", "epoch: 136, batch: 3700 // loss: 0.043\n", "\n", "epoch: 137, batch: 0 // loss: 0.053\n", "epoch: 137, batch: 100 // loss: 0.046\n", "epoch: 137, batch: 200 // loss: 0.043\n", "epoch: 137, batch: 300 // loss: 0.049\n", "epoch: 137, batch: 400 // loss: 0.046\n", "epoch: 137, batch: 500 // loss: 0.040\n", "epoch: 137, batch: 600 // loss: 0.040\n", "epoch: 137, batch: 700 // loss: 0.044\n", "epoch: 137, batch: 800 // loss: 0.042\n", "epoch: 137, batch: 900 // loss: 0.049\n", "epoch: 137, batch: 1000 // loss: 0.046\n", "epoch: 137, batch: 1100 // loss: 0.042\n", "epoch: 137, batch: 1200 // loss: 0.044\n", "epoch: 137, batch: 1300 // loss: 0.046\n", "epoch: 137, batch: 1400 // loss: 0.043\n", "epoch: 137, batch: 1500 // loss: 0.048\n", "epoch: 137, batch: 1600 // loss: 0.052\n", "epoch: 137, batch: 1700 // loss: 0.045\n", "epoch: 137, batch: 1800 // loss: 0.053\n", "epoch: 137, batch: 1900 // loss: 0.045\n", "epoch: 137, batch: 2000 // loss: 0.047\n", "epoch: 137, batch: 2100 // loss: 0.046\n", "epoch: 137, batch: 2200 // loss: 0.050\n", "epoch: 137, batch: 2300 // loss: 0.049\n", "epoch: 137, batch: 2400 // loss: 0.042\n", "epoch: 137, batch: 2500 // loss: 0.042\n", "epoch: 137, batch: 2600 // loss: 0.045\n", "epoch: 137, batch: 2700 // loss: 0.042\n", "epoch: 137, batch: 2800 // loss: 0.046\n", "epoch: 137, batch: 2900 // loss: 0.042\n", "epoch: 137, batch: 3000 // loss: 0.045\n", "epoch: 137, batch: 3100 // loss: 0.043\n", "epoch: 137, batch: 3200 // loss: 0.039\n", "epoch: 137, batch: 3300 // loss: 0.038\n", "epoch: 137, batch: 3400 // loss: 0.044\n", "epoch: 137, batch: 3500 // loss: 0.035\n", "epoch: 137, batch: 3600 // loss: 0.043\n", "epoch: 137, batch: 3700 // loss: 0.043\n", "\n", "epoch: 138, batch: 0 // loss: 0.053\n", "epoch: 138, batch: 100 // loss: 0.046\n", "epoch: 138, batch: 200 // loss: 0.043\n", "epoch: 138, batch: 300 // loss: 0.049\n", "epoch: 138, batch: 400 // loss: 0.046\n", "epoch: 138, batch: 500 // loss: 0.040\n", "epoch: 138, batch: 600 // loss: 0.040\n", "epoch: 138, batch: 700 // loss: 0.044\n", "epoch: 138, batch: 800 // loss: 0.042\n", "epoch: 138, batch: 900 // loss: 0.049\n", "epoch: 138, batch: 1000 // loss: 0.046\n", "epoch: 138, batch: 1100 // loss: 0.042\n", "epoch: 138, batch: 1200 // loss: 0.044\n", "epoch: 138, batch: 1300 // loss: 0.046\n", "epoch: 138, batch: 1400 // loss: 0.043\n", "epoch: 138, batch: 1500 // loss: 0.048\n", "epoch: 138, batch: 1600 // loss: 0.052\n", "epoch: 138, batch: 1700 // loss: 0.045\n", "epoch: 138, batch: 1800 // loss: 0.053\n", "epoch: 138, batch: 1900 // loss: 0.045\n", "epoch: 138, batch: 2000 // loss: 0.047\n", "epoch: 138, batch: 2100 // loss: 0.046\n", "epoch: 138, batch: 2200 // loss: 0.050\n", "epoch: 138, batch: 2300 // loss: 0.049\n", "epoch: 138, batch: 2400 // loss: 0.042\n", "epoch: 138, batch: 2500 // loss: 0.042\n", "epoch: 138, batch: 2600 // loss: 0.045\n", "epoch: 138, batch: 2700 // loss: 0.042\n", "epoch: 138, batch: 2800 // loss: 0.046\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 138, batch: 2900 // loss: 0.042\n", "epoch: 138, batch: 3000 // loss: 0.045\n", "epoch: 138, batch: 3100 // loss: 0.043\n", "epoch: 138, batch: 3200 // loss: 0.039\n", "epoch: 138, batch: 3300 // loss: 0.038\n", "epoch: 138, batch: 3400 // loss: 0.044\n", "epoch: 138, batch: 3500 // loss: 0.035\n", "epoch: 138, batch: 3600 // loss: 0.043\n", "epoch: 138, batch: 3700 // loss: 0.043\n", "\n", "epoch: 139, batch: 0 // loss: 0.053\n", "epoch: 139, batch: 100 // loss: 0.046\n", "epoch: 139, batch: 200 // loss: 0.043\n", "epoch: 139, batch: 300 // loss: 0.049\n", "epoch: 139, batch: 400 // loss: 0.046\n", "epoch: 139, batch: 500 // loss: 0.040\n", "epoch: 139, batch: 600 // loss: 0.040\n", "epoch: 139, batch: 700 // loss: 0.044\n", "epoch: 139, batch: 800 // loss: 0.042\n", "epoch: 139, batch: 900 // loss: 0.049\n", "epoch: 139, batch: 1000 // loss: 0.046\n", "epoch: 139, batch: 1100 // loss: 0.042\n", "epoch: 139, batch: 1200 // loss: 0.044\n", "epoch: 139, batch: 1300 // loss: 0.046\n", "epoch: 139, batch: 1400 // loss: 0.043\n", "epoch: 139, batch: 1500 // loss: 0.048\n", "epoch: 139, batch: 1600 // loss: 0.052\n", "epoch: 139, batch: 1700 // loss: 0.045\n", "epoch: 139, batch: 1800 // loss: 0.053\n", "epoch: 139, batch: 1900 // loss: 0.045\n", "epoch: 139, batch: 2000 // loss: 0.047\n", "epoch: 139, batch: 2100 // loss: 0.046\n", "epoch: 139, batch: 2200 // loss: 0.050\n", "epoch: 139, batch: 2300 // loss: 0.049\n", "epoch: 139, batch: 2400 // loss: 0.042\n", "epoch: 139, batch: 2500 // loss: 0.042\n", "epoch: 139, batch: 2600 // loss: 0.045\n", "epoch: 139, batch: 2700 // loss: 0.042\n", "epoch: 139, batch: 2800 // loss: 0.046\n", "epoch: 139, batch: 2900 // loss: 0.042\n", "epoch: 139, batch: 3000 // loss: 0.045\n", "epoch: 139, batch: 3100 // loss: 0.043\n", "epoch: 139, batch: 3200 // loss: 0.039\n", "epoch: 139, batch: 3300 // loss: 0.038\n", "epoch: 139, batch: 3400 // loss: 0.044\n", "epoch: 139, batch: 3500 // loss: 0.035\n", "epoch: 139, batch: 3600 // loss: 0.043\n", "epoch: 139, batch: 3700 // loss: 0.043\n", "\n", "epoch: 140, batch: 0 // loss: 0.053\n", "epoch: 140, batch: 100 // loss: 0.046\n", "epoch: 140, batch: 200 // loss: 0.043\n", "epoch: 140, batch: 300 // loss: 0.049\n", "epoch: 140, batch: 400 // loss: 0.046\n", "epoch: 140, batch: 500 // loss: 0.040\n", "epoch: 140, batch: 600 // loss: 0.040\n", "epoch: 140, batch: 700 // loss: 0.044\n", "epoch: 140, batch: 800 // loss: 0.042\n", "epoch: 140, batch: 900 // loss: 0.049\n", "epoch: 140, batch: 1000 // loss: 0.046\n", "epoch: 140, batch: 1100 // loss: 0.042\n", "epoch: 140, batch: 1200 // loss: 0.044\n", "epoch: 140, batch: 1300 // loss: 0.046\n", "epoch: 140, batch: 1400 // loss: 0.043\n", "epoch: 140, batch: 1500 // loss: 0.048\n", "epoch: 140, batch: 1600 // loss: 0.052\n", "epoch: 140, batch: 1700 // loss: 0.045\n", "epoch: 140, batch: 1800 // loss: 0.053\n", "epoch: 140, batch: 1900 // loss: 0.045\n", "epoch: 140, batch: 2000 // loss: 0.047\n", "epoch: 140, batch: 2100 // loss: 0.046\n", "epoch: 140, batch: 2200 // loss: 0.050\n", "epoch: 140, batch: 2300 // loss: 0.049\n", "epoch: 140, batch: 2400 // loss: 0.042\n", "epoch: 140, batch: 2500 // loss: 0.042\n", "epoch: 140, batch: 2600 // loss: 0.045\n", "epoch: 140, batch: 2700 // loss: 0.042\n", "epoch: 140, batch: 2800 // loss: 0.046\n", "epoch: 140, batch: 2900 // loss: 0.042\n", "epoch: 140, batch: 3000 // loss: 0.045\n", "epoch: 140, batch: 3100 // loss: 0.043\n", "epoch: 140, batch: 3200 // loss: 0.039\n", "epoch: 140, batch: 3300 // loss: 0.038\n", "epoch: 140, batch: 3400 // loss: 0.044\n", "epoch: 140, batch: 3500 // loss: 0.035\n", "epoch: 140, batch: 3600 // loss: 0.043\n", "epoch: 140, batch: 3700 // loss: 0.043\n", "\n", "epoch: 141, batch: 0 // loss: 0.053\n", "epoch: 141, batch: 100 // loss: 0.046\n", "epoch: 141, batch: 200 // loss: 0.043\n", "epoch: 141, batch: 300 // loss: 0.049\n", "epoch: 141, batch: 400 // loss: 0.046\n", "epoch: 141, batch: 500 // loss: 0.040\n", "epoch: 141, batch: 600 // loss: 0.040\n", "epoch: 141, batch: 700 // loss: 0.044\n", "epoch: 141, batch: 800 // loss: 0.042\n", "epoch: 141, batch: 900 // loss: 0.049\n", "epoch: 141, batch: 1000 // loss: 0.046\n", "epoch: 141, batch: 1100 // loss: 0.042\n", "epoch: 141, batch: 1200 // loss: 0.044\n", "epoch: 141, batch: 1300 // loss: 0.046\n", "epoch: 141, batch: 1400 // loss: 0.043\n", "epoch: 141, batch: 1500 // loss: 0.048\n", "epoch: 141, batch: 1600 // loss: 0.052\n", "epoch: 141, batch: 1700 // loss: 0.045\n", "epoch: 141, batch: 1800 // loss: 0.053\n", "epoch: 141, batch: 1900 // loss: 0.045\n", "epoch: 141, batch: 2000 // loss: 0.047\n", "epoch: 141, batch: 2100 // loss: 0.046\n", "epoch: 141, batch: 2200 // loss: 0.050\n", "epoch: 141, batch: 2300 // loss: 0.049\n", "epoch: 141, batch: 2400 // loss: 0.042\n", "epoch: 141, batch: 2500 // loss: 0.042\n", "epoch: 141, batch: 2600 // loss: 0.045\n", "epoch: 141, batch: 2700 // loss: 0.042\n", "epoch: 141, batch: 2800 // loss: 0.046\n", "epoch: 141, batch: 2900 // loss: 0.042\n", "epoch: 141, batch: 3000 // loss: 0.045\n", "epoch: 141, batch: 3100 // loss: 0.043\n", "epoch: 141, batch: 3200 // loss: 0.039\n", "epoch: 141, batch: 3300 // loss: 0.038\n", "epoch: 141, batch: 3400 // loss: 0.044\n", "epoch: 141, batch: 3500 // loss: 0.035\n", "epoch: 141, batch: 3600 // loss: 0.043\n", "epoch: 141, batch: 3700 // loss: 0.043\n", "\n", "epoch: 142, batch: 0 // loss: 0.053\n", "epoch: 142, batch: 100 // loss: 0.046\n", "epoch: 142, batch: 200 // loss: 0.043\n", "epoch: 142, batch: 300 // loss: 0.049\n", "epoch: 142, batch: 400 // loss: 0.046\n", "epoch: 142, batch: 500 // loss: 0.040\n", "epoch: 142, batch: 600 // loss: 0.040\n", "epoch: 142, batch: 700 // loss: 0.044\n", "epoch: 142, batch: 800 // loss: 0.042\n", "epoch: 142, batch: 900 // loss: 0.049\n", "epoch: 142, batch: 1000 // loss: 0.046\n", "epoch: 142, batch: 1100 // loss: 0.042\n", "epoch: 142, batch: 1200 // loss: 0.044\n", "epoch: 142, batch: 1300 // loss: 0.046\n", "epoch: 142, batch: 1400 // loss: 0.043\n", "epoch: 142, batch: 1500 // loss: 0.048\n", "epoch: 142, batch: 1600 // loss: 0.052\n", "epoch: 142, batch: 1700 // loss: 0.045\n", "epoch: 142, batch: 1800 // loss: 0.053\n", "epoch: 142, batch: 1900 // loss: 0.045\n", "epoch: 142, batch: 2000 // loss: 0.047\n", "epoch: 142, batch: 2100 // loss: 0.046\n", "epoch: 142, batch: 2200 // loss: 0.050\n", "epoch: 142, batch: 2300 // loss: 0.049\n", "epoch: 142, batch: 2400 // loss: 0.042\n", "epoch: 142, batch: 2500 // loss: 0.042\n", "epoch: 142, batch: 2600 // loss: 0.045\n", "epoch: 142, batch: 2700 // loss: 0.042\n", "epoch: 142, batch: 2800 // loss: 0.046\n", "epoch: 142, batch: 2900 // loss: 0.042\n", "epoch: 142, batch: 3000 // loss: 0.045\n", "epoch: 142, batch: 3100 // loss: 0.043\n", "epoch: 142, batch: 3200 // loss: 0.039\n", "epoch: 142, batch: 3300 // loss: 0.038\n", "epoch: 142, batch: 3400 // loss: 0.044\n", "epoch: 142, batch: 3500 // loss: 0.035\n", "epoch: 142, batch: 3600 // loss: 0.043\n", "epoch: 142, batch: 3700 // loss: 0.043\n", "\n", "epoch: 143, batch: 0 // loss: 0.053\n", "epoch: 143, batch: 100 // loss: 0.046\n", "epoch: 143, batch: 200 // loss: 0.043\n", "epoch: 143, batch: 300 // loss: 0.049\n", "epoch: 143, batch: 400 // loss: 0.046\n", "epoch: 143, batch: 500 // loss: 0.040\n", "epoch: 143, batch: 600 // loss: 0.040\n", "epoch: 143, batch: 700 // loss: 0.044\n", "epoch: 143, batch: 800 // loss: 0.042\n", "epoch: 143, batch: 900 // loss: 0.049\n", "epoch: 143, batch: 1000 // loss: 0.046\n", "epoch: 143, batch: 1100 // loss: 0.042\n", "epoch: 143, batch: 1200 // loss: 0.044\n", "epoch: 143, batch: 1300 // loss: 0.046\n", "epoch: 143, batch: 1400 // loss: 0.043\n", "epoch: 143, batch: 1500 // loss: 0.048\n", "epoch: 143, batch: 1600 // loss: 0.052\n", "epoch: 143, batch: 1700 // loss: 0.045\n", "epoch: 143, batch: 1800 // loss: 0.053\n", "epoch: 143, batch: 1900 // loss: 0.045\n", "epoch: 143, batch: 2000 // loss: 0.047\n", "epoch: 143, batch: 2100 // loss: 0.046\n", "epoch: 143, batch: 2200 // loss: 0.050\n", "epoch: 143, batch: 2300 // loss: 0.049\n", "epoch: 143, batch: 2400 // loss: 0.042\n", "epoch: 143, batch: 2500 // loss: 0.042\n", "epoch: 143, batch: 2600 // loss: 0.045\n", "epoch: 143, batch: 2700 // loss: 0.042\n", "epoch: 143, batch: 2800 // loss: 0.046\n", "epoch: 143, batch: 2900 // loss: 0.042\n", "epoch: 143, batch: 3000 // loss: 0.045\n", "epoch: 143, batch: 3100 // loss: 0.043\n", "epoch: 143, batch: 3200 // loss: 0.039\n", "epoch: 143, batch: 3300 // loss: 0.038\n", "epoch: 143, batch: 3400 // loss: 0.044\n", "epoch: 143, batch: 3500 // loss: 0.035\n", "epoch: 143, batch: 3600 // loss: 0.043\n", "epoch: 143, batch: 3700 // loss: 0.043\n", "\n", "epoch: 144, batch: 0 // loss: 0.053\n", "epoch: 144, batch: 100 // loss: 0.046\n", "epoch: 144, batch: 200 // loss: 0.043\n", "epoch: 144, batch: 300 // loss: 0.049\n", "epoch: 144, batch: 400 // loss: 0.046\n", "epoch: 144, batch: 500 // loss: 0.040\n", "epoch: 144, batch: 600 // loss: 0.040\n", "epoch: 144, batch: 700 // loss: 0.044\n", "epoch: 144, batch: 800 // loss: 0.042\n", "epoch: 144, batch: 900 // loss: 0.049\n", "epoch: 144, batch: 1000 // loss: 0.046\n", "epoch: 144, batch: 1100 // loss: 0.042\n", "epoch: 144, batch: 1200 // loss: 0.044\n", "epoch: 144, batch: 1300 // loss: 0.046\n", "epoch: 144, batch: 1400 // loss: 0.043\n", "epoch: 144, batch: 1500 // loss: 0.048\n", "epoch: 144, batch: 1600 // loss: 0.052\n", "epoch: 144, batch: 1700 // loss: 0.045\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 144, batch: 1800 // loss: 0.053\n", "epoch: 144, batch: 1900 // loss: 0.045\n", "epoch: 144, batch: 2000 // loss: 0.047\n", "epoch: 144, batch: 2100 // loss: 0.046\n", "epoch: 144, batch: 2200 // loss: 0.050\n", "epoch: 144, batch: 2300 // loss: 0.049\n", "epoch: 144, batch: 2400 // loss: 0.042\n", "epoch: 144, batch: 2500 // loss: 0.042\n", "epoch: 144, batch: 2600 // loss: 0.045\n", "epoch: 144, batch: 2700 // loss: 0.042\n", "epoch: 144, batch: 2800 // loss: 0.046\n", "epoch: 144, batch: 2900 // loss: 0.042\n", "epoch: 144, batch: 3000 // loss: 0.045\n", "epoch: 144, batch: 3100 // loss: 0.043\n", "epoch: 144, batch: 3200 // loss: 0.039\n", "epoch: 144, batch: 3300 // loss: 0.038\n", "epoch: 144, batch: 3400 // loss: 0.044\n", "epoch: 144, batch: 3500 // loss: 0.035\n", "epoch: 144, batch: 3600 // loss: 0.043\n", "epoch: 144, batch: 3700 // loss: 0.043\n", "\n", "epoch: 145, batch: 0 // loss: 0.053\n", "epoch: 145, batch: 100 // loss: 0.046\n", "epoch: 145, batch: 200 // loss: 0.043\n", "epoch: 145, batch: 300 // loss: 0.049\n", "epoch: 145, batch: 400 // loss: 0.046\n", "epoch: 145, batch: 500 // loss: 0.040\n", "epoch: 145, batch: 600 // loss: 0.040\n", "epoch: 145, batch: 700 // loss: 0.044\n", "epoch: 145, batch: 800 // loss: 0.042\n", "epoch: 145, batch: 900 // loss: 0.049\n", "epoch: 145, batch: 1000 // loss: 0.046\n", "epoch: 145, batch: 1100 // loss: 0.042\n", "epoch: 145, batch: 1200 // loss: 0.044\n", "epoch: 145, batch: 1300 // loss: 0.046\n", "epoch: 145, batch: 1400 // loss: 0.043\n", "epoch: 145, batch: 1500 // loss: 0.048\n", "epoch: 145, batch: 1600 // loss: 0.052\n", "epoch: 145, batch: 1700 // loss: 0.045\n", "epoch: 145, batch: 1800 // loss: 0.053\n", "epoch: 145, batch: 1900 // loss: 0.045\n", "epoch: 145, batch: 2000 // loss: 0.047\n", "epoch: 145, batch: 2100 // loss: 0.046\n", "epoch: 145, batch: 2200 // loss: 0.050\n", "epoch: 145, batch: 2300 // loss: 0.049\n", "epoch: 145, batch: 2400 // loss: 0.042\n", "epoch: 145, batch: 2500 // loss: 0.042\n", "epoch: 145, batch: 2600 // loss: 0.045\n", "epoch: 145, batch: 2700 // loss: 0.042\n", "epoch: 145, batch: 2800 // loss: 0.046\n", "epoch: 145, batch: 2900 // loss: 0.042\n", "epoch: 145, batch: 3000 // loss: 0.045\n", "epoch: 145, batch: 3100 // loss: 0.043\n", "epoch: 145, batch: 3200 // loss: 0.039\n", "epoch: 145, batch: 3300 // loss: 0.038\n", "epoch: 145, batch: 3400 // loss: 0.044\n", "epoch: 145, batch: 3500 // loss: 0.035\n", "epoch: 145, batch: 3600 // loss: 0.043\n", "epoch: 145, batch: 3700 // loss: 0.043\n", "\n", "epoch: 146, batch: 0 // loss: 0.053\n", "epoch: 146, batch: 100 // loss: 0.046\n", "epoch: 146, batch: 200 // loss: 0.043\n", "epoch: 146, batch: 300 // loss: 0.049\n", "epoch: 146, batch: 400 // loss: 0.046\n", "epoch: 146, batch: 500 // loss: 0.040\n", "epoch: 146, batch: 600 // loss: 0.040\n", "epoch: 146, batch: 700 // loss: 0.044\n", "epoch: 146, batch: 800 // loss: 0.042\n", "epoch: 146, batch: 900 // loss: 0.049\n", "epoch: 146, batch: 1000 // loss: 0.046\n", "epoch: 146, batch: 1100 // loss: 0.042\n", "epoch: 146, batch: 1200 // loss: 0.044\n", "epoch: 146, batch: 1300 // loss: 0.046\n", "epoch: 146, batch: 1400 // loss: 0.043\n", "epoch: 146, batch: 1500 // loss: 0.048\n", "epoch: 146, batch: 1600 // loss: 0.052\n", "epoch: 146, batch: 1700 // loss: 0.045\n", "epoch: 146, batch: 1800 // loss: 0.053\n", "epoch: 146, batch: 1900 // loss: 0.045\n", "epoch: 146, batch: 2000 // loss: 0.047\n", "epoch: 146, batch: 2100 // loss: 0.046\n", "epoch: 146, batch: 2200 // loss: 0.050\n", "epoch: 146, batch: 2300 // loss: 0.049\n", "epoch: 146, batch: 2400 // loss: 0.042\n", "epoch: 146, batch: 2500 // loss: 0.042\n", "epoch: 146, batch: 2600 // loss: 0.045\n", "epoch: 146, batch: 2700 // loss: 0.042\n", "epoch: 146, batch: 2800 // loss: 0.046\n", "epoch: 146, batch: 2900 // loss: 0.042\n", "epoch: 146, batch: 3000 // loss: 0.045\n", "epoch: 146, batch: 3100 // loss: 0.043\n", "epoch: 146, batch: 3200 // loss: 0.039\n", "epoch: 146, batch: 3300 // loss: 0.038\n", "epoch: 146, batch: 3400 // loss: 0.044\n", "epoch: 146, batch: 3500 // loss: 0.035\n", "epoch: 146, batch: 3600 // loss: 0.043\n", "epoch: 146, batch: 3700 // loss: 0.043\n", "\n", "epoch: 147, batch: 0 // loss: 0.053\n", "epoch: 147, batch: 100 // loss: 0.046\n", "epoch: 147, batch: 200 // loss: 0.043\n", "epoch: 147, batch: 300 // loss: 0.049\n", "epoch: 147, batch: 400 // loss: 0.046\n", "epoch: 147, batch: 500 // loss: 0.040\n", "epoch: 147, batch: 600 // loss: 0.040\n", "epoch: 147, batch: 700 // loss: 0.044\n", "epoch: 147, batch: 800 // loss: 0.042\n", "epoch: 147, batch: 900 // loss: 0.049\n", "epoch: 147, batch: 1000 // loss: 0.046\n", "epoch: 147, batch: 1100 // loss: 0.042\n", "epoch: 147, batch: 1200 // loss: 0.044\n", "epoch: 147, batch: 1300 // loss: 0.046\n", "epoch: 147, batch: 1400 // loss: 0.043\n", "epoch: 147, batch: 1500 // loss: 0.048\n", "epoch: 147, batch: 1600 // loss: 0.052\n", "epoch: 147, batch: 1700 // loss: 0.045\n", "epoch: 147, batch: 1800 // loss: 0.053\n", "epoch: 147, batch: 1900 // loss: 0.045\n", "epoch: 147, batch: 2000 // loss: 0.047\n", "epoch: 147, batch: 2100 // loss: 0.046\n", "epoch: 147, batch: 2200 // loss: 0.050\n", "epoch: 147, batch: 2300 // loss: 0.049\n", "epoch: 147, batch: 2400 // loss: 0.042\n", "epoch: 147, batch: 2500 // loss: 0.042\n", "epoch: 147, batch: 2600 // loss: 0.045\n", "epoch: 147, batch: 2700 // loss: 0.042\n", "epoch: 147, batch: 2800 // loss: 0.046\n", "epoch: 147, batch: 2900 // loss: 0.042\n", "epoch: 147, batch: 3000 // loss: 0.045\n", "epoch: 147, batch: 3100 // loss: 0.043\n", "epoch: 147, batch: 3200 // loss: 0.039\n", "epoch: 147, batch: 3300 // loss: 0.038\n", "epoch: 147, batch: 3400 // loss: 0.044\n", "epoch: 147, batch: 3500 // loss: 0.035\n", "epoch: 147, batch: 3600 // loss: 0.043\n", "epoch: 147, batch: 3700 // loss: 0.043\n", "\n", "epoch: 148, batch: 0 // loss: 0.053\n", "epoch: 148, batch: 100 // loss: 0.046\n", "epoch: 148, batch: 200 // loss: 0.043\n", "epoch: 148, batch: 300 // loss: 0.049\n", "epoch: 148, batch: 400 // loss: 0.046\n", "epoch: 148, batch: 500 // loss: 0.040\n", "epoch: 148, batch: 600 // loss: 0.040\n", "epoch: 148, batch: 700 // loss: 0.044\n", "epoch: 148, batch: 800 // loss: 0.042\n", "epoch: 148, batch: 900 // loss: 0.049\n", "epoch: 148, batch: 1000 // loss: 0.046\n", "epoch: 148, batch: 1100 // loss: 0.042\n", "epoch: 148, batch: 1200 // loss: 0.044\n", "epoch: 148, batch: 1300 // loss: 0.046\n", "epoch: 148, batch: 1400 // loss: 0.043\n", "epoch: 148, batch: 1500 // loss: 0.048\n", "epoch: 148, batch: 1600 // loss: 0.052\n", "epoch: 148, batch: 1700 // loss: 0.045\n", "epoch: 148, batch: 1800 // loss: 0.053\n", "epoch: 148, batch: 1900 // loss: 0.045\n", "epoch: 148, batch: 2000 // loss: 0.047\n", "epoch: 148, batch: 2100 // loss: 0.046\n", "epoch: 148, batch: 2200 // loss: 0.050\n", "epoch: 148, batch: 2300 // loss: 0.049\n", "epoch: 148, batch: 2400 // loss: 0.042\n", "epoch: 148, batch: 2500 // loss: 0.042\n", "epoch: 148, batch: 2600 // loss: 0.045\n", "epoch: 148, batch: 2700 // loss: 0.042\n", "epoch: 148, batch: 2800 // loss: 0.046\n", "epoch: 148, batch: 2900 // loss: 0.042\n", "epoch: 148, batch: 3000 // loss: 0.045\n", "epoch: 148, batch: 3100 // loss: 0.043\n", "epoch: 148, batch: 3200 // loss: 0.039\n", "epoch: 148, batch: 3300 // loss: 0.038\n", "epoch: 148, batch: 3400 // loss: 0.044\n", "epoch: 148, batch: 3500 // loss: 0.035\n", "epoch: 148, batch: 3600 // loss: 0.043\n", "epoch: 148, batch: 3700 // loss: 0.043\n", "\n", "epoch: 149, batch: 0 // loss: 0.053\n", "epoch: 149, batch: 100 // loss: 0.046\n", "epoch: 149, batch: 200 // loss: 0.043\n", "epoch: 149, batch: 300 // loss: 0.049\n", "epoch: 149, batch: 400 // loss: 0.046\n", "epoch: 149, batch: 500 // loss: 0.040\n", "epoch: 149, batch: 600 // loss: 0.040\n", "epoch: 149, batch: 700 // loss: 0.044\n", "epoch: 149, batch: 800 // loss: 0.042\n", "epoch: 149, batch: 900 // loss: 0.049\n", "epoch: 149, batch: 1000 // loss: 0.046\n", "epoch: 149, batch: 1100 // loss: 0.042\n", "epoch: 149, batch: 1200 // loss: 0.044\n", "epoch: 149, batch: 1300 // loss: 0.046\n", "epoch: 149, batch: 1400 // loss: 0.043\n", "epoch: 149, batch: 1500 // loss: 0.048\n", "epoch: 149, batch: 1600 // loss: 0.052\n", "epoch: 149, batch: 1700 // loss: 0.045\n", "epoch: 149, batch: 1800 // loss: 0.053\n", "epoch: 149, batch: 1900 // loss: 0.045\n", "epoch: 149, batch: 2000 // loss: 0.047\n", "epoch: 149, batch: 2100 // loss: 0.046\n", "epoch: 149, batch: 2200 // loss: 0.050\n", "epoch: 149, batch: 2300 // loss: 0.049\n", "epoch: 149, batch: 2400 // loss: 0.042\n", "epoch: 149, batch: 2500 // loss: 0.042\n", "epoch: 149, batch: 2600 // loss: 0.045\n", "epoch: 149, batch: 2700 // loss: 0.042\n", "epoch: 149, batch: 2800 // loss: 0.046\n", "epoch: 149, batch: 2900 // loss: 0.042\n", "epoch: 149, batch: 3000 // loss: 0.045\n", "epoch: 149, batch: 3100 // loss: 0.043\n", "epoch: 149, batch: 3200 // loss: 0.039\n", "epoch: 149, batch: 3300 // loss: 0.038\n", "epoch: 149, batch: 3400 // loss: 0.044\n", "epoch: 149, batch: 3500 // loss: 0.035\n", "epoch: 149, batch: 3600 // loss: 0.043\n", "epoch: 149, batch: 3700 // loss: 0.043\n", "\n", "epoch: 150, batch: 0 // loss: 0.053\n", "epoch: 150, batch: 100 // loss: 0.046\n", "epoch: 150, batch: 200 // loss: 0.043\n", "epoch: 150, batch: 300 // loss: 0.049\n", "epoch: 150, batch: 400 // loss: 0.046\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 150, batch: 500 // loss: 0.040\n", "epoch: 150, batch: 600 // loss: 0.040\n", "epoch: 150, batch: 700 // loss: 0.044\n", "epoch: 150, batch: 800 // loss: 0.042\n", "epoch: 150, batch: 900 // loss: 0.049\n", "epoch: 150, batch: 1000 // loss: 0.046\n", "epoch: 150, batch: 1100 // loss: 0.042\n", "epoch: 150, batch: 1200 // loss: 0.044\n", "epoch: 150, batch: 1300 // loss: 0.046\n", "epoch: 150, batch: 1400 // loss: 0.043\n", "epoch: 150, batch: 1500 // loss: 0.048\n", "epoch: 150, batch: 1600 // loss: 0.052\n", "epoch: 150, batch: 1700 // loss: 0.045\n", "epoch: 150, batch: 1800 // loss: 0.053\n", "epoch: 150, batch: 1900 // loss: 0.045\n", "epoch: 150, batch: 2000 // loss: 0.047\n", "epoch: 150, batch: 2100 // loss: 0.046\n", "epoch: 150, batch: 2200 // loss: 0.050\n", "epoch: 150, batch: 2300 // loss: 0.049\n", "epoch: 150, batch: 2400 // loss: 0.042\n", "epoch: 150, batch: 2500 // loss: 0.042\n", "epoch: 150, batch: 2600 // loss: 0.045\n", "epoch: 150, batch: 2700 // loss: 0.042\n", "epoch: 150, batch: 2800 // loss: 0.046\n", "epoch: 150, batch: 2900 // loss: 0.042\n", "epoch: 150, batch: 3000 // loss: 0.045\n", "epoch: 150, batch: 3100 // loss: 0.043\n", "epoch: 150, batch: 3200 // loss: 0.039\n", "epoch: 150, batch: 3300 // loss: 0.038\n", "epoch: 150, batch: 3400 // loss: 0.044\n", "epoch: 150, batch: 3500 // loss: 0.035\n", "epoch: 150, batch: 3600 // loss: 0.043\n", "epoch: 150, batch: 3700 // loss: 0.043\n", "\n", "epoch: 151, batch: 0 // loss: 0.053\n", "epoch: 151, batch: 100 // loss: 0.046\n", "epoch: 151, batch: 200 // loss: 0.043\n", "epoch: 151, batch: 300 // loss: 0.049\n", "epoch: 151, batch: 400 // loss: 0.046\n", "epoch: 151, batch: 500 // loss: 0.040\n", "epoch: 151, batch: 600 // loss: 0.040\n", "epoch: 151, batch: 700 // loss: 0.044\n", "epoch: 151, batch: 800 // loss: 0.042\n", "epoch: 151, batch: 900 // loss: 0.049\n", "epoch: 151, batch: 1000 // loss: 0.046\n", "epoch: 151, batch: 1100 // loss: 0.042\n", "epoch: 151, batch: 1200 // loss: 0.044\n", "epoch: 151, batch: 1300 // loss: 0.046\n", "epoch: 151, batch: 1400 // loss: 0.043\n", "epoch: 151, batch: 1500 // loss: 0.048\n", "epoch: 151, batch: 1600 // loss: 0.052\n", "epoch: 151, batch: 1700 // loss: 0.045\n", "epoch: 151, batch: 1800 // loss: 0.053\n", "epoch: 151, batch: 1900 // loss: 0.045\n", "epoch: 151, batch: 2000 // loss: 0.047\n", "epoch: 151, batch: 2100 // loss: 0.046\n", "epoch: 151, batch: 2200 // loss: 0.050\n", "epoch: 151, batch: 2300 // loss: 0.049\n", "epoch: 151, batch: 2400 // loss: 0.042\n", "epoch: 151, batch: 2500 // loss: 0.042\n", "epoch: 151, batch: 2600 // loss: 0.045\n", "epoch: 151, batch: 2700 // loss: 0.042\n", "epoch: 151, batch: 2800 // loss: 0.046\n", "epoch: 151, batch: 2900 // loss: 0.042\n", "epoch: 151, batch: 3000 // loss: 0.045\n", "epoch: 151, batch: 3100 // loss: 0.043\n", "epoch: 151, batch: 3200 // loss: 0.039\n", "epoch: 151, batch: 3300 // loss: 0.038\n", "epoch: 151, batch: 3400 // loss: 0.044\n", "epoch: 151, batch: 3500 // loss: 0.035\n", "epoch: 151, batch: 3600 // loss: 0.043\n", "epoch: 151, batch: 3700 // loss: 0.043\n", "\n", "epoch: 152, batch: 0 // loss: 0.053\n", "epoch: 152, batch: 100 // loss: 0.046\n", "epoch: 152, batch: 200 // loss: 0.043\n", "epoch: 152, batch: 300 // loss: 0.049\n", "epoch: 152, batch: 400 // loss: 0.046\n", "epoch: 152, batch: 500 // loss: 0.040\n", "epoch: 152, batch: 600 // loss: 0.040\n", "epoch: 152, batch: 700 // loss: 0.044\n", "epoch: 152, batch: 800 // loss: 0.042\n", "epoch: 152, batch: 900 // loss: 0.049\n", "epoch: 152, batch: 1000 // loss: 0.046\n", "epoch: 152, batch: 1100 // loss: 0.042\n", "epoch: 152, batch: 1200 // loss: 0.044\n", "epoch: 152, batch: 1300 // loss: 0.046\n", "epoch: 152, batch: 1400 // loss: 0.043\n", "epoch: 152, batch: 1500 // loss: 0.048\n", "epoch: 152, batch: 1600 // loss: 0.052\n", "epoch: 152, batch: 1700 // loss: 0.045\n", "epoch: 152, batch: 1800 // loss: 0.053\n", "epoch: 152, batch: 1900 // loss: 0.045\n", "epoch: 152, batch: 2000 // loss: 0.047\n", "epoch: 152, batch: 2100 // loss: 0.046\n", "epoch: 152, batch: 2200 // loss: 0.050\n", "epoch: 152, batch: 2300 // loss: 0.049\n", "epoch: 152, batch: 2400 // loss: 0.042\n", "epoch: 152, batch: 2500 // loss: 0.042\n", "epoch: 152, batch: 2600 // loss: 0.045\n", "epoch: 152, batch: 2700 // loss: 0.042\n", "epoch: 152, batch: 2800 // loss: 0.046\n", "epoch: 152, batch: 2900 // loss: 0.042\n", "epoch: 152, batch: 3000 // loss: 0.045\n", "epoch: 152, batch: 3100 // loss: 0.043\n", "epoch: 152, batch: 3200 // loss: 0.039\n", "epoch: 152, batch: 3300 // loss: 0.038\n", "epoch: 152, batch: 3400 // loss: 0.044\n", "epoch: 152, batch: 3500 // loss: 0.035\n", "epoch: 152, batch: 3600 // loss: 0.043\n", "epoch: 152, batch: 3700 // loss: 0.043\n", "\n", "epoch: 153, batch: 0 // loss: 0.053\n", "epoch: 153, batch: 100 // loss: 0.046\n", "epoch: 153, batch: 200 // loss: 0.043\n", "epoch: 153, batch: 300 // loss: 0.049\n", "epoch: 153, batch: 400 // loss: 0.046\n", "epoch: 153, batch: 500 // loss: 0.040\n", "epoch: 153, batch: 600 // loss: 0.040\n", "epoch: 153, batch: 700 // loss: 0.044\n", "epoch: 153, batch: 800 // loss: 0.042\n", "epoch: 153, batch: 900 // loss: 0.049\n", "epoch: 153, batch: 1000 // loss: 0.046\n", "epoch: 153, batch: 1100 // loss: 0.042\n", "epoch: 153, batch: 1200 // loss: 0.044\n", "epoch: 153, batch: 1300 // loss: 0.046\n", "epoch: 153, batch: 1400 // loss: 0.043\n", "epoch: 153, batch: 1500 // loss: 0.048\n", "epoch: 153, batch: 1600 // loss: 0.052\n", "epoch: 153, batch: 1700 // loss: 0.045\n", "epoch: 153, batch: 1800 // loss: 0.053\n", "epoch: 153, batch: 1900 // loss: 0.045\n", "epoch: 153, batch: 2000 // loss: 0.047\n", "epoch: 153, batch: 2100 // loss: 0.046\n", "epoch: 153, batch: 2200 // loss: 0.050\n", "epoch: 153, batch: 2300 // loss: 0.049\n", "epoch: 153, batch: 2400 // loss: 0.042\n", "epoch: 153, batch: 2500 // loss: 0.042\n", "epoch: 153, batch: 2600 // loss: 0.045\n", "epoch: 153, batch: 2700 // loss: 0.042\n", "epoch: 153, batch: 2800 // loss: 0.046\n", "epoch: 153, batch: 2900 // loss: 0.042\n", "epoch: 153, batch: 3000 // loss: 0.045\n", "epoch: 153, batch: 3100 // loss: 0.043\n", "epoch: 153, batch: 3200 // loss: 0.039\n", "epoch: 153, batch: 3300 // loss: 0.038\n", "epoch: 153, batch: 3400 // loss: 0.044\n", "epoch: 153, batch: 3500 // loss: 0.035\n", "epoch: 153, batch: 3600 // loss: 0.043\n", "epoch: 153, batch: 3700 // loss: 0.043\n", "\n", "epoch: 154, batch: 0 // loss: 0.053\n", "epoch: 154, batch: 100 // loss: 0.046\n", "epoch: 154, batch: 200 // loss: 0.043\n", "epoch: 154, batch: 300 // loss: 0.049\n", "epoch: 154, batch: 400 // loss: 0.046\n", "epoch: 154, batch: 500 // loss: 0.040\n", "epoch: 154, batch: 600 // loss: 0.040\n", "epoch: 154, batch: 700 // loss: 0.044\n", "epoch: 154, batch: 800 // loss: 0.042\n", "epoch: 154, batch: 900 // loss: 0.049\n", "epoch: 154, batch: 1000 // loss: 0.046\n", "epoch: 154, batch: 1100 // loss: 0.042\n", "epoch: 154, batch: 1200 // loss: 0.044\n", "epoch: 154, batch: 1300 // loss: 0.046\n", "epoch: 154, batch: 1400 // loss: 0.043\n", "epoch: 154, batch: 1500 // loss: 0.048\n", "epoch: 154, batch: 1600 // loss: 0.052\n", "epoch: 154, batch: 1700 // loss: 0.045\n", "epoch: 154, batch: 1800 // loss: 0.053\n", "epoch: 154, batch: 1900 // loss: 0.045\n", "epoch: 154, batch: 2000 // loss: 0.047\n", "epoch: 154, batch: 2100 // loss: 0.046\n", "epoch: 154, batch: 2200 // loss: 0.050\n", "epoch: 154, batch: 2300 // loss: 0.049\n", "epoch: 154, batch: 2400 // loss: 0.042\n", "epoch: 154, batch: 2500 // loss: 0.042\n", "epoch: 154, batch: 2600 // loss: 0.045\n", "epoch: 154, batch: 2700 // loss: 0.042\n", "epoch: 154, batch: 2800 // loss: 0.046\n", "epoch: 154, batch: 2900 // loss: 0.042\n", "epoch: 154, batch: 3000 // loss: 0.045\n", "epoch: 154, batch: 3100 // loss: 0.043\n", "epoch: 154, batch: 3200 // loss: 0.039\n", "epoch: 154, batch: 3300 // loss: 0.038\n", "epoch: 154, batch: 3400 // loss: 0.044\n", "epoch: 154, batch: 3500 // loss: 0.035\n", "epoch: 154, batch: 3600 // loss: 0.043\n", "epoch: 154, batch: 3700 // loss: 0.043\n", "\n", "epoch: 155, batch: 0 // loss: 0.053\n", "epoch: 155, batch: 100 // loss: 0.046\n", "epoch: 155, batch: 200 // loss: 0.043\n", "epoch: 155, batch: 300 // loss: 0.049\n", "epoch: 155, batch: 400 // loss: 0.046\n", "epoch: 155, batch: 500 // loss: 0.040\n", "epoch: 155, batch: 600 // loss: 0.040\n", "epoch: 155, batch: 700 // loss: 0.044\n", "epoch: 155, batch: 800 // loss: 0.042\n", "epoch: 155, batch: 900 // loss: 0.049\n", "epoch: 155, batch: 1000 // loss: 0.046\n", "epoch: 155, batch: 1100 // loss: 0.042\n", "epoch: 155, batch: 1200 // loss: 0.044\n", "epoch: 155, batch: 1300 // loss: 0.046\n", "epoch: 155, batch: 1400 // loss: 0.043\n", "epoch: 155, batch: 1500 // loss: 0.048\n", "epoch: 155, batch: 1600 // loss: 0.052\n", "epoch: 155, batch: 1700 // loss: 0.045\n", "epoch: 155, batch: 1800 // loss: 0.053\n", "epoch: 155, batch: 1900 // loss: 0.045\n", "epoch: 155, batch: 2000 // loss: 0.047\n", "epoch: 155, batch: 2100 // loss: 0.046\n", "epoch: 155, batch: 2200 // loss: 0.050\n", "epoch: 155, batch: 2300 // loss: 0.049\n", "epoch: 155, batch: 2400 // loss: 0.042\n", "epoch: 155, batch: 2500 // loss: 0.042\n", "epoch: 155, batch: 2600 // loss: 0.045\n", "epoch: 155, batch: 2700 // loss: 0.042\n", "epoch: 155, batch: 2800 // loss: 0.046\n", "epoch: 155, batch: 2900 // loss: 0.042\n", "epoch: 155, batch: 3000 // loss: 0.045\n", "epoch: 155, batch: 3100 // loss: 0.043\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 155, batch: 3200 // loss: 0.039\n", "epoch: 155, batch: 3300 // loss: 0.038\n", "epoch: 155, batch: 3400 // loss: 0.044\n", "epoch: 155, batch: 3500 // loss: 0.035\n", "epoch: 155, batch: 3600 // loss: 0.043\n", "epoch: 155, batch: 3700 // loss: 0.043\n", "\n", "epoch: 156, batch: 0 // loss: 0.053\n", "epoch: 156, batch: 100 // loss: 0.046\n", "epoch: 156, batch: 200 // loss: 0.043\n", "epoch: 156, batch: 300 // loss: 0.049\n", "epoch: 156, batch: 400 // loss: 0.046\n", "epoch: 156, batch: 500 // loss: 0.040\n", "epoch: 156, batch: 600 // loss: 0.040\n", "epoch: 156, batch: 700 // loss: 0.044\n", "epoch: 156, batch: 800 // loss: 0.042\n", "epoch: 156, batch: 900 // loss: 0.049\n", "epoch: 156, batch: 1000 // loss: 0.046\n", "epoch: 156, batch: 1100 // loss: 0.042\n", "epoch: 156, batch: 1200 // loss: 0.044\n", "epoch: 156, batch: 1300 // loss: 0.046\n", "epoch: 156, batch: 1400 // loss: 0.043\n", "epoch: 156, batch: 1500 // loss: 0.048\n", "epoch: 156, batch: 1600 // loss: 0.052\n", "epoch: 156, batch: 1700 // loss: 0.045\n", "epoch: 156, batch: 1800 // loss: 0.053\n", "epoch: 156, batch: 1900 // loss: 0.045\n", "epoch: 156, batch: 2000 // loss: 0.047\n", "epoch: 156, batch: 2100 // loss: 0.046\n", "epoch: 156, batch: 2200 // loss: 0.050\n", "epoch: 156, batch: 2300 // loss: 0.049\n", "epoch: 156, batch: 2400 // loss: 0.042\n", "epoch: 156, batch: 2500 // loss: 0.042\n", "epoch: 156, batch: 2600 // loss: 0.045\n", "epoch: 156, batch: 2700 // loss: 0.042\n", "epoch: 156, batch: 2800 // loss: 0.046\n", "epoch: 156, batch: 2900 // loss: 0.042\n", "epoch: 156, batch: 3000 // loss: 0.045\n", "epoch: 156, batch: 3100 // loss: 0.043\n", "epoch: 156, batch: 3200 // loss: 0.039\n", "epoch: 156, batch: 3300 // loss: 0.038\n", "epoch: 156, batch: 3400 // loss: 0.044\n", "epoch: 156, batch: 3500 // loss: 0.035\n", "epoch: 156, batch: 3600 // loss: 0.043\n", "epoch: 156, batch: 3700 // loss: 0.043\n", "\n", "epoch: 157, batch: 0 // loss: 0.053\n", "epoch: 157, batch: 100 // loss: 0.046\n", "epoch: 157, batch: 200 // loss: 0.043\n", "epoch: 157, batch: 300 // loss: 0.049\n", "epoch: 157, batch: 400 // loss: 0.046\n", "epoch: 157, batch: 500 // loss: 0.040\n", "epoch: 157, batch: 600 // loss: 0.040\n", "epoch: 157, batch: 700 // loss: 0.044\n", "epoch: 157, batch: 800 // loss: 0.042\n", "epoch: 157, batch: 900 // loss: 0.049\n", "epoch: 157, batch: 1000 // loss: 0.046\n", "epoch: 157, batch: 1100 // loss: 0.042\n", "epoch: 157, batch: 1200 // loss: 0.044\n", "epoch: 157, batch: 1300 // loss: 0.046\n", "epoch: 157, batch: 1400 // loss: 0.043\n", "epoch: 157, batch: 1500 // loss: 0.048\n", "epoch: 157, batch: 1600 // loss: 0.052\n", "epoch: 157, batch: 1700 // loss: 0.045\n", "epoch: 157, batch: 1800 // loss: 0.053\n", "epoch: 157, batch: 1900 // loss: 0.045\n", "epoch: 157, batch: 2000 // loss: 0.047\n", "epoch: 157, batch: 2100 // loss: 0.046\n", "epoch: 157, batch: 2200 // loss: 0.050\n", "epoch: 157, batch: 2300 // loss: 0.049\n", "epoch: 157, batch: 2400 // loss: 0.042\n", "epoch: 157, batch: 2500 // loss: 0.042\n", "epoch: 157, batch: 2600 // loss: 0.045\n", "epoch: 157, batch: 2700 // loss: 0.042\n", "epoch: 157, batch: 2800 // loss: 0.046\n", "epoch: 157, batch: 2900 // loss: 0.042\n", "epoch: 157, batch: 3000 // loss: 0.045\n", "epoch: 157, batch: 3100 // loss: 0.043\n", "epoch: 157, batch: 3200 // loss: 0.039\n", "epoch: 157, batch: 3300 // loss: 0.038\n", "epoch: 157, batch: 3400 // loss: 0.044\n", "epoch: 157, batch: 3500 // loss: 0.035\n", "epoch: 157, batch: 3600 // loss: 0.043\n", "epoch: 157, batch: 3700 // loss: 0.043\n", "\n", "epoch: 158, batch: 0 // loss: 0.053\n", "epoch: 158, batch: 100 // loss: 0.046\n", "epoch: 158, batch: 200 // loss: 0.043\n", "epoch: 158, batch: 300 // loss: 0.049\n", "epoch: 158, batch: 400 // loss: 0.046\n", "epoch: 158, batch: 500 // loss: 0.040\n", "epoch: 158, batch: 600 // loss: 0.040\n", "epoch: 158, batch: 700 // loss: 0.044\n", "epoch: 158, batch: 800 // loss: 0.042\n", "epoch: 158, batch: 900 // loss: 0.049\n", "epoch: 158, batch: 1000 // loss: 0.046\n", "epoch: 158, batch: 1100 // loss: 0.042\n", "epoch: 158, batch: 1200 // loss: 0.044\n", "epoch: 158, batch: 1300 // loss: 0.046\n", "epoch: 158, batch: 1400 // loss: 0.043\n", "epoch: 158, batch: 1500 // loss: 0.048\n", "epoch: 158, batch: 1600 // loss: 0.052\n", "epoch: 158, batch: 1700 // loss: 0.045\n", "epoch: 158, batch: 1800 // loss: 0.053\n", "epoch: 158, batch: 1900 // loss: 0.045\n", "epoch: 158, batch: 2000 // loss: 0.047\n", "epoch: 158, batch: 2100 // loss: 0.046\n", "epoch: 158, batch: 2200 // loss: 0.050\n", "epoch: 158, batch: 2300 // loss: 0.049\n", "epoch: 158, batch: 2400 // loss: 0.042\n", "epoch: 158, batch: 2500 // loss: 0.042\n", "epoch: 158, batch: 2600 // loss: 0.045\n", "epoch: 158, batch: 2700 // loss: 0.042\n", "epoch: 158, batch: 2800 // loss: 0.046\n", "epoch: 158, batch: 2900 // loss: 0.042\n", "epoch: 158, batch: 3000 // loss: 0.045\n", "epoch: 158, batch: 3100 // loss: 0.043\n", "epoch: 158, batch: 3200 // loss: 0.039\n", "epoch: 158, batch: 3300 // loss: 0.038\n", "epoch: 158, batch: 3400 // loss: 0.044\n", "epoch: 158, batch: 3500 // loss: 0.035\n", "epoch: 158, batch: 3600 // loss: 0.043\n", "epoch: 158, batch: 3700 // loss: 0.043\n", "\n", "epoch: 159, batch: 0 // loss: 0.053\n", "epoch: 159, batch: 100 // loss: 0.046\n", "epoch: 159, batch: 200 // loss: 0.043\n", "epoch: 159, batch: 300 // loss: 0.049\n", "epoch: 159, batch: 400 // loss: 0.046\n", "epoch: 159, batch: 500 // loss: 0.040\n", "epoch: 159, batch: 600 // loss: 0.040\n", "epoch: 159, batch: 700 // loss: 0.044\n", "epoch: 159, batch: 800 // loss: 0.042\n", "epoch: 159, batch: 900 // loss: 0.049\n", "epoch: 159, batch: 1000 // loss: 0.046\n", "epoch: 159, batch: 1100 // loss: 0.042\n", "epoch: 159, batch: 1200 // loss: 0.044\n", "epoch: 159, batch: 1300 // loss: 0.046\n", "epoch: 159, batch: 1400 // loss: 0.043\n", "epoch: 159, batch: 1500 // loss: 0.048\n", "epoch: 159, batch: 1600 // loss: 0.052\n", "epoch: 159, batch: 1700 // loss: 0.045\n", "epoch: 159, batch: 1800 // loss: 0.053\n", "epoch: 159, batch: 1900 // loss: 0.045\n", "epoch: 159, batch: 2000 // loss: 0.047\n", "epoch: 159, batch: 2100 // loss: 0.046\n", "epoch: 159, batch: 2200 // loss: 0.050\n", "epoch: 159, batch: 2300 // loss: 0.049\n", "epoch: 159, batch: 2400 // loss: 0.042\n", "epoch: 159, batch: 2500 // loss: 0.042\n", "epoch: 159, batch: 2600 // loss: 0.045\n", "epoch: 159, batch: 2700 // loss: 0.042\n", "epoch: 159, batch: 2800 // loss: 0.046\n", "epoch: 159, batch: 2900 // loss: 0.042\n", "epoch: 159, batch: 3000 // loss: 0.045\n", "epoch: 159, batch: 3100 // loss: 0.043\n", "epoch: 159, batch: 3200 // loss: 0.039\n", "epoch: 159, batch: 3300 // loss: 0.038\n", "epoch: 159, batch: 3400 // loss: 0.044\n", "epoch: 159, batch: 3500 // loss: 0.035\n", "epoch: 159, batch: 3600 // loss: 0.043\n", "epoch: 159, batch: 3700 // loss: 0.043\n", "\n", "epoch: 160, batch: 0 // loss: 0.053\n", "epoch: 160, batch: 100 // loss: 0.046\n", "epoch: 160, batch: 200 // loss: 0.043\n", "epoch: 160, batch: 300 // loss: 0.049\n", "epoch: 160, batch: 400 // loss: 0.046\n", "epoch: 160, batch: 500 // loss: 0.040\n", "epoch: 160, batch: 600 // loss: 0.040\n", "epoch: 160, batch: 700 // loss: 0.044\n", "epoch: 160, batch: 800 // loss: 0.042\n", "epoch: 160, batch: 900 // loss: 0.049\n", "epoch: 160, batch: 1000 // loss: 0.046\n", "epoch: 160, batch: 1100 // loss: 0.042\n", "epoch: 160, batch: 1200 // loss: 0.044\n", "epoch: 160, batch: 1300 // loss: 0.046\n", "epoch: 160, batch: 1400 // loss: 0.043\n", "epoch: 160, batch: 1500 // loss: 0.048\n", "epoch: 160, batch: 1600 // loss: 0.052\n", "epoch: 160, batch: 1700 // loss: 0.045\n", "epoch: 160, batch: 1800 // loss: 0.053\n", "epoch: 160, batch: 1900 // loss: 0.045\n", "epoch: 160, batch: 2000 // loss: 0.047\n", "epoch: 160, batch: 2100 // loss: 0.046\n", "epoch: 160, batch: 2200 // loss: 0.050\n", "epoch: 160, batch: 2300 // loss: 0.049\n", "epoch: 160, batch: 2400 // loss: 0.042\n", "epoch: 160, batch: 2500 // loss: 0.042\n", "epoch: 160, batch: 2600 // loss: 0.045\n", "epoch: 160, batch: 2700 // loss: 0.042\n", "epoch: 160, batch: 2800 // loss: 0.046\n", "epoch: 160, batch: 2900 // loss: 0.042\n", "epoch: 160, batch: 3000 // loss: 0.045\n", "epoch: 160, batch: 3100 // loss: 0.043\n", "epoch: 160, batch: 3200 // loss: 0.039\n", "epoch: 160, batch: 3300 // loss: 0.038\n", "epoch: 160, batch: 3400 // loss: 0.044\n", "epoch: 160, batch: 3500 // loss: 0.035\n", "epoch: 160, batch: 3600 // loss: 0.043\n", "epoch: 160, batch: 3700 // loss: 0.043\n", "\n", "epoch: 161, batch: 0 // loss: 0.053\n", "epoch: 161, batch: 100 // loss: 0.046\n", "epoch: 161, batch: 200 // loss: 0.043\n", "epoch: 161, batch: 300 // loss: 0.049\n", "epoch: 161, batch: 400 // loss: 0.046\n", "epoch: 161, batch: 500 // loss: 0.040\n", "epoch: 161, batch: 600 // loss: 0.040\n", "epoch: 161, batch: 700 // loss: 0.044\n", "epoch: 161, batch: 800 // loss: 0.042\n", "epoch: 161, batch: 900 // loss: 0.049\n", "epoch: 161, batch: 1000 // loss: 0.046\n", "epoch: 161, batch: 1100 // loss: 0.042\n", "epoch: 161, batch: 1200 // loss: 0.044\n", "epoch: 161, batch: 1300 // loss: 0.046\n", "epoch: 161, batch: 1400 // loss: 0.043\n", "epoch: 161, batch: 1500 // loss: 0.048\n", "epoch: 161, batch: 1600 // loss: 0.052\n", "epoch: 161, batch: 1700 // loss: 0.045\n", "epoch: 161, batch: 1800 // loss: 0.053\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 161, batch: 1900 // loss: 0.045\n", "epoch: 161, batch: 2000 // loss: 0.047\n", "epoch: 161, batch: 2100 // loss: 0.046\n", "epoch: 161, batch: 2200 // loss: 0.050\n", "epoch: 161, batch: 2300 // loss: 0.049\n", "epoch: 161, batch: 2400 // loss: 0.042\n", "epoch: 161, batch: 2500 // loss: 0.042\n", "epoch: 161, batch: 2600 // loss: 0.045\n", "epoch: 161, batch: 2700 // loss: 0.042\n", "epoch: 161, batch: 2800 // loss: 0.046\n", "epoch: 161, batch: 2900 // loss: 0.042\n", "epoch: 161, batch: 3000 // loss: 0.045\n", "epoch: 161, batch: 3100 // loss: 0.043\n", "epoch: 161, batch: 3200 // loss: 0.039\n", "epoch: 161, batch: 3300 // loss: 0.038\n", "epoch: 161, batch: 3400 // loss: 0.044\n", "epoch: 161, batch: 3500 // loss: 0.035\n", "epoch: 161, batch: 3600 // loss: 0.043\n", "epoch: 161, batch: 3700 // loss: 0.043\n", "\n", "epoch: 162, batch: 0 // loss: 0.053\n", "epoch: 162, batch: 100 // loss: 0.046\n", "epoch: 162, batch: 200 // loss: 0.043\n", "epoch: 162, batch: 300 // loss: 0.049\n", "epoch: 162, batch: 400 // loss: 0.046\n", "epoch: 162, batch: 500 // loss: 0.040\n", "epoch: 162, batch: 600 // loss: 0.040\n", "epoch: 162, batch: 700 // loss: 0.044\n", "epoch: 162, batch: 800 // loss: 0.042\n", "epoch: 162, batch: 900 // loss: 0.049\n", "epoch: 162, batch: 1000 // loss: 0.046\n", "epoch: 162, batch: 1100 // loss: 0.042\n", "epoch: 162, batch: 1200 // loss: 0.044\n", "epoch: 162, batch: 1300 // loss: 0.046\n", "epoch: 162, batch: 1400 // loss: 0.043\n", "epoch: 162, batch: 1500 // loss: 0.048\n", "epoch: 162, batch: 1600 // loss: 0.052\n", "epoch: 162, batch: 1700 // loss: 0.045\n", "epoch: 162, batch: 1800 // loss: 0.053\n", "epoch: 162, batch: 1900 // loss: 0.045\n", "epoch: 162, batch: 2000 // loss: 0.047\n", "epoch: 162, batch: 2100 // loss: 0.046\n", "epoch: 162, batch: 2200 // loss: 0.050\n", "epoch: 162, batch: 2300 // loss: 0.049\n", "epoch: 162, batch: 2400 // loss: 0.042\n", "epoch: 162, batch: 2500 // loss: 0.042\n", "epoch: 162, batch: 2600 // loss: 0.045\n", "epoch: 162, batch: 2700 // loss: 0.042\n", "epoch: 162, batch: 2800 // loss: 0.046\n", "epoch: 162, batch: 2900 // loss: 0.042\n", "epoch: 162, batch: 3000 // loss: 0.045\n", "epoch: 162, batch: 3100 // loss: 0.043\n", "epoch: 162, batch: 3200 // loss: 0.039\n", "epoch: 162, batch: 3300 // loss: 0.038\n", "epoch: 162, batch: 3400 // loss: 0.044\n", "epoch: 162, batch: 3500 // loss: 0.035\n", "epoch: 162, batch: 3600 // loss: 0.043\n", "epoch: 162, batch: 3700 // loss: 0.043\n", "\n", "epoch: 163, batch: 0 // loss: 0.053\n", "epoch: 163, batch: 100 // loss: 0.046\n", "epoch: 163, batch: 200 // loss: 0.043\n", "epoch: 163, batch: 300 // loss: 0.049\n", "epoch: 163, batch: 400 // loss: 0.046\n", "epoch: 163, batch: 500 // loss: 0.040\n", "epoch: 163, batch: 600 // loss: 0.040\n", "epoch: 163, batch: 700 // loss: 0.044\n", "epoch: 163, batch: 800 // loss: 0.042\n", "epoch: 163, batch: 900 // loss: 0.049\n", "epoch: 163, batch: 1000 // loss: 0.046\n", "epoch: 163, batch: 1100 // loss: 0.042\n", "epoch: 163, batch: 1200 // loss: 0.044\n", "epoch: 163, batch: 1300 // loss: 0.046\n", "epoch: 163, batch: 1400 // loss: 0.043\n", "epoch: 163, batch: 1500 // loss: 0.048\n", "epoch: 163, batch: 1600 // loss: 0.052\n", "epoch: 163, batch: 1700 // loss: 0.045\n", "epoch: 163, batch: 1800 // loss: 0.053\n", "epoch: 163, batch: 1900 // loss: 0.045\n", "epoch: 163, batch: 2000 // loss: 0.047\n", "epoch: 163, batch: 2100 // loss: 0.046\n", "epoch: 163, batch: 2200 // loss: 0.050\n", "epoch: 163, batch: 2300 // loss: 0.049\n", "epoch: 163, batch: 2400 // loss: 0.042\n", "epoch: 163, batch: 2500 // loss: 0.042\n", "epoch: 163, batch: 2600 // loss: 0.045\n", "epoch: 163, batch: 2700 // loss: 0.042\n", "epoch: 163, batch: 2800 // loss: 0.046\n", "epoch: 163, batch: 2900 // loss: 0.042\n", "epoch: 163, batch: 3000 // loss: 0.045\n", "epoch: 163, batch: 3100 // loss: 0.043\n", "epoch: 163, batch: 3200 // loss: 0.039\n", "epoch: 163, batch: 3300 // loss: 0.038\n", "epoch: 163, batch: 3400 // loss: 0.044\n", "epoch: 163, batch: 3500 // loss: 0.035\n", "epoch: 163, batch: 3600 // loss: 0.043\n", "epoch: 163, batch: 3700 // loss: 0.043\n", "\n", "epoch: 164, batch: 0 // loss: 0.053\n", "epoch: 164, batch: 100 // loss: 0.046\n", "epoch: 164, batch: 200 // loss: 0.043\n", "epoch: 164, batch: 300 // loss: 0.049\n", "epoch: 164, batch: 400 // loss: 0.046\n", "epoch: 164, batch: 500 // loss: 0.040\n", "epoch: 164, batch: 600 // loss: 0.040\n", "epoch: 164, batch: 700 // loss: 0.044\n", "epoch: 164, batch: 800 // loss: 0.042\n", "epoch: 164, batch: 900 // loss: 0.049\n", "epoch: 164, batch: 1000 // loss: 0.046\n", "epoch: 164, batch: 1100 // loss: 0.042\n", "epoch: 164, batch: 1200 // loss: 0.044\n", "epoch: 164, batch: 1300 // loss: 0.046\n", "epoch: 164, batch: 1400 // loss: 0.043\n", "epoch: 164, batch: 1500 // loss: 0.048\n", "epoch: 164, batch: 1600 // loss: 0.052\n", "epoch: 164, batch: 1700 // loss: 0.045\n", "epoch: 164, batch: 1800 // loss: 0.053\n", "epoch: 164, batch: 1900 // loss: 0.045\n", "epoch: 164, batch: 2000 // loss: 0.047\n", "epoch: 164, batch: 2100 // loss: 0.046\n", "epoch: 164, batch: 2200 // loss: 0.050\n", "epoch: 164, batch: 2300 // loss: 0.049\n", "epoch: 164, batch: 2400 // loss: 0.042\n", "epoch: 164, batch: 2500 // loss: 0.042\n", "epoch: 164, batch: 2600 // loss: 0.045\n", "epoch: 164, batch: 2700 // loss: 0.042\n", "epoch: 164, batch: 2800 // loss: 0.046\n", "epoch: 164, batch: 2900 // loss: 0.042\n", "epoch: 164, batch: 3000 // loss: 0.045\n", "epoch: 164, batch: 3100 // loss: 0.043\n", "epoch: 164, batch: 3200 // loss: 0.039\n", "epoch: 164, batch: 3300 // loss: 0.038\n", "epoch: 164, batch: 3400 // loss: 0.044\n", "epoch: 164, batch: 3500 // loss: 0.035\n", "epoch: 164, batch: 3600 // loss: 0.043\n", "epoch: 164, batch: 3700 // loss: 0.043\n", "\n", "epoch: 165, batch: 0 // loss: 0.053\n", "epoch: 165, batch: 100 // loss: 0.046\n", "epoch: 165, batch: 200 // loss: 0.043\n", "epoch: 165, batch: 300 // loss: 0.049\n", "epoch: 165, batch: 400 // loss: 0.046\n", "epoch: 165, batch: 500 // loss: 0.040\n", "epoch: 165, batch: 600 // loss: 0.040\n", "epoch: 165, batch: 700 // loss: 0.044\n", "epoch: 165, batch: 800 // loss: 0.042\n", "epoch: 165, batch: 900 // loss: 0.049\n", "epoch: 165, batch: 1000 // loss: 0.046\n", "epoch: 165, batch: 1100 // loss: 0.042\n", "epoch: 165, batch: 1200 // loss: 0.044\n", "epoch: 165, batch: 1300 // loss: 0.046\n", "epoch: 165, batch: 1400 // loss: 0.043\n", "epoch: 165, batch: 1500 // loss: 0.048\n", "epoch: 165, batch: 1600 // loss: 0.052\n", "epoch: 165, batch: 1700 // loss: 0.045\n", "epoch: 165, batch: 1800 // loss: 0.053\n", "epoch: 165, batch: 1900 // loss: 0.045\n", "epoch: 165, batch: 2000 // loss: 0.047\n", "epoch: 165, batch: 2100 // loss: 0.046\n", "epoch: 165, batch: 2200 // loss: 0.050\n", "epoch: 165, batch: 2300 // loss: 0.049\n", "epoch: 165, batch: 2400 // loss: 0.042\n", "epoch: 165, batch: 2500 // loss: 0.042\n", "epoch: 165, batch: 2600 // loss: 0.045\n", "epoch: 165, batch: 2700 // loss: 0.042\n", "epoch: 165, batch: 2800 // loss: 0.046\n", "epoch: 165, batch: 2900 // loss: 0.042\n", "epoch: 165, batch: 3000 // loss: 0.045\n", "epoch: 165, batch: 3100 // loss: 0.043\n", "epoch: 165, batch: 3200 // loss: 0.039\n", "epoch: 165, batch: 3300 // loss: 0.038\n", "epoch: 165, batch: 3400 // loss: 0.044\n", "epoch: 165, batch: 3500 // loss: 0.035\n", "epoch: 165, batch: 3600 // loss: 0.043\n", "epoch: 165, batch: 3700 // loss: 0.043\n", "\n", "epoch: 166, batch: 0 // loss: 0.053\n", "epoch: 166, batch: 100 // loss: 0.046\n", "epoch: 166, batch: 200 // loss: 0.043\n", "epoch: 166, batch: 300 // loss: 0.049\n", "epoch: 166, batch: 400 // loss: 0.046\n", "epoch: 166, batch: 500 // loss: 0.040\n", "epoch: 166, batch: 600 // loss: 0.040\n", "epoch: 166, batch: 700 // loss: 0.044\n", "epoch: 166, batch: 800 // loss: 0.042\n", "epoch: 166, batch: 900 // loss: 0.049\n", "epoch: 166, batch: 1000 // loss: 0.046\n", "epoch: 166, batch: 1100 // loss: 0.042\n", "epoch: 166, batch: 1200 // loss: 0.044\n", "epoch: 166, batch: 1300 // loss: 0.046\n", "epoch: 166, batch: 1400 // loss: 0.043\n", "epoch: 166, batch: 1500 // loss: 0.048\n", "epoch: 166, batch: 1600 // loss: 0.052\n", "epoch: 166, batch: 1700 // loss: 0.045\n", "epoch: 166, batch: 1800 // loss: 0.053\n", "epoch: 166, batch: 1900 // loss: 0.045\n", "epoch: 166, batch: 2000 // loss: 0.047\n", "epoch: 166, batch: 2100 // loss: 0.046\n", "epoch: 166, batch: 2200 // loss: 0.050\n", "epoch: 166, batch: 2300 // loss: 0.049\n", "epoch: 166, batch: 2400 // loss: 0.042\n", "epoch: 166, batch: 2500 // loss: 0.042\n", "epoch: 166, batch: 2600 // loss: 0.045\n", "epoch: 166, batch: 2700 // loss: 0.042\n", "epoch: 166, batch: 2800 // loss: 0.046\n", "epoch: 166, batch: 2900 // loss: 0.042\n", "epoch: 166, batch: 3000 // loss: 0.045\n", "epoch: 166, batch: 3100 // loss: 0.043\n", "epoch: 166, batch: 3200 // loss: 0.039\n", "epoch: 166, batch: 3300 // loss: 0.038\n", "epoch: 166, batch: 3400 // loss: 0.044\n", "epoch: 166, batch: 3500 // loss: 0.035\n", "epoch: 166, batch: 3600 // loss: 0.043\n", "epoch: 166, batch: 3700 // loss: 0.043\n", "\n", "epoch: 167, batch: 0 // loss: 0.053\n", "epoch: 167, batch: 100 // loss: 0.046\n", "epoch: 167, batch: 200 // loss: 0.043\n", "epoch: 167, batch: 300 // loss: 0.049\n", "epoch: 167, batch: 400 // loss: 0.046\n", "epoch: 167, batch: 500 // loss: 0.040\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 167, batch: 600 // loss: 0.040\n", "epoch: 167, batch: 700 // loss: 0.044\n", "epoch: 167, batch: 800 // loss: 0.042\n", "epoch: 167, batch: 900 // loss: 0.049\n", "epoch: 167, batch: 1000 // loss: 0.046\n", "epoch: 167, batch: 1100 // loss: 0.042\n", "epoch: 167, batch: 1200 // loss: 0.044\n", "epoch: 167, batch: 1300 // loss: 0.046\n", "epoch: 167, batch: 1400 // loss: 0.043\n", "epoch: 167, batch: 1500 // loss: 0.048\n", "epoch: 167, batch: 1600 // loss: 0.052\n", "epoch: 167, batch: 1700 // loss: 0.045\n", "epoch: 167, batch: 1800 // loss: 0.053\n", "epoch: 167, batch: 1900 // loss: 0.045\n", "epoch: 167, batch: 2000 // loss: 0.047\n", "epoch: 167, batch: 2100 // loss: 0.046\n", "epoch: 167, batch: 2200 // loss: 0.050\n", "epoch: 167, batch: 2300 // loss: 0.049\n", "epoch: 167, batch: 2400 // loss: 0.042\n", "epoch: 167, batch: 2500 // loss: 0.042\n", "epoch: 167, batch: 2600 // loss: 0.045\n", "epoch: 167, batch: 2700 // loss: 0.042\n", "epoch: 167, batch: 2800 // loss: 0.046\n", "epoch: 167, batch: 2900 // loss: 0.042\n", "epoch: 167, batch: 3000 // loss: 0.045\n", "epoch: 167, batch: 3100 // loss: 0.043\n", "epoch: 167, batch: 3200 // loss: 0.039\n", "epoch: 167, batch: 3300 // loss: 0.038\n", "epoch: 167, batch: 3400 // loss: 0.044\n", "epoch: 167, batch: 3500 // loss: 0.035\n", "epoch: 167, batch: 3600 // loss: 0.043\n", "epoch: 167, batch: 3700 // loss: 0.043\n", "\n", "epoch: 168, batch: 0 // loss: 0.053\n", "epoch: 168, batch: 100 // loss: 0.046\n", "epoch: 168, batch: 200 // loss: 0.043\n", "epoch: 168, batch: 300 // loss: 0.049\n", "epoch: 168, batch: 400 // loss: 0.046\n", "epoch: 168, batch: 500 // loss: 0.040\n", "epoch: 168, batch: 600 // loss: 0.040\n", "epoch: 168, batch: 700 // loss: 0.044\n", "epoch: 168, batch: 800 // loss: 0.042\n", "epoch: 168, batch: 900 // loss: 0.049\n", "epoch: 168, batch: 1000 // loss: 0.046\n", "epoch: 168, batch: 1100 // loss: 0.042\n", "epoch: 168, batch: 1200 // loss: 0.044\n", "epoch: 168, batch: 1300 // loss: 0.046\n", "epoch: 168, batch: 1400 // loss: 0.043\n", "epoch: 168, batch: 1500 // loss: 0.048\n", "epoch: 168, batch: 1600 // loss: 0.052\n", "epoch: 168, batch: 1700 // loss: 0.045\n", "epoch: 168, batch: 1800 // loss: 0.053\n", "epoch: 168, batch: 1900 // loss: 0.045\n", "epoch: 168, batch: 2000 // loss: 0.047\n", "epoch: 168, batch: 2100 // loss: 0.046\n", "epoch: 168, batch: 2200 // loss: 0.050\n", "epoch: 168, batch: 2300 // loss: 0.049\n", "epoch: 168, batch: 2400 // loss: 0.042\n", "epoch: 168, batch: 2500 // loss: 0.042\n", "epoch: 168, batch: 2600 // loss: 0.045\n", "epoch: 168, batch: 2700 // loss: 0.042\n", "epoch: 168, batch: 2800 // loss: 0.046\n", "epoch: 168, batch: 2900 // loss: 0.042\n", "epoch: 168, batch: 3000 // loss: 0.045\n", "epoch: 168, batch: 3100 // loss: 0.043\n", "epoch: 168, batch: 3200 // loss: 0.039\n", "epoch: 168, batch: 3300 // loss: 0.038\n", "epoch: 168, batch: 3400 // loss: 0.044\n", "epoch: 168, batch: 3500 // loss: 0.035\n", "epoch: 168, batch: 3600 // loss: 0.043\n", "epoch: 168, batch: 3700 // loss: 0.043\n", "\n", "epoch: 169, batch: 0 // loss: 0.053\n", "epoch: 169, batch: 100 // loss: 0.046\n", "epoch: 169, batch: 200 // loss: 0.043\n", "epoch: 169, batch: 300 // loss: 0.049\n", "epoch: 169, batch: 400 // loss: 0.046\n", "epoch: 169, batch: 500 // loss: 0.040\n", "epoch: 169, batch: 600 // loss: 0.040\n", "epoch: 169, batch: 700 // loss: 0.044\n", "epoch: 169, batch: 800 // loss: 0.042\n", "epoch: 169, batch: 900 // loss: 0.049\n", "epoch: 169, batch: 1000 // loss: 0.046\n", "epoch: 169, batch: 1100 // loss: 0.042\n", "epoch: 169, batch: 1200 // loss: 0.044\n", "epoch: 169, batch: 1300 // loss: 0.046\n", "epoch: 169, batch: 1400 // loss: 0.043\n", "epoch: 169, batch: 1500 // loss: 0.048\n", "epoch: 169, batch: 1600 // loss: 0.052\n", "epoch: 169, batch: 1700 // loss: 0.045\n", "epoch: 169, batch: 1800 // loss: 0.053\n", "epoch: 169, batch: 1900 // loss: 0.045\n", "epoch: 169, batch: 2000 // loss: 0.047\n", "epoch: 169, batch: 2100 // loss: 0.046\n", "epoch: 169, batch: 2200 // loss: 0.050\n", "epoch: 169, batch: 2300 // loss: 0.049\n", "epoch: 169, batch: 2400 // loss: 0.042\n", "epoch: 169, batch: 2500 // loss: 0.042\n", "epoch: 169, batch: 2600 // loss: 0.045\n", "epoch: 169, batch: 2700 // loss: 0.042\n", "epoch: 169, batch: 2800 // loss: 0.046\n", "epoch: 169, batch: 2900 // loss: 0.042\n", "epoch: 169, batch: 3000 // loss: 0.045\n", "epoch: 169, batch: 3100 // loss: 0.043\n", "epoch: 169, batch: 3200 // loss: 0.039\n", "epoch: 169, batch: 3300 // loss: 0.038\n", "epoch: 169, batch: 3400 // loss: 0.044\n", "epoch: 169, batch: 3500 // loss: 0.035\n", "epoch: 169, batch: 3600 // loss: 0.043\n", "epoch: 169, batch: 3700 // loss: 0.043\n", "\n", "epoch: 170, batch: 0 // loss: 0.053\n", "epoch: 170, batch: 100 // loss: 0.046\n", "epoch: 170, batch: 200 // loss: 0.043\n", "epoch: 170, batch: 300 // loss: 0.049\n", "epoch: 170, batch: 400 // loss: 0.046\n", "epoch: 170, batch: 500 // loss: 0.040\n", "epoch: 170, batch: 600 // loss: 0.040\n", "epoch: 170, batch: 700 // loss: 0.044\n", "epoch: 170, batch: 800 // loss: 0.042\n", "epoch: 170, batch: 900 // loss: 0.049\n", "epoch: 170, batch: 1000 // loss: 0.046\n", "epoch: 170, batch: 1100 // loss: 0.042\n", "epoch: 170, batch: 1200 // loss: 0.044\n", "epoch: 170, batch: 1300 // loss: 0.046\n", "epoch: 170, batch: 1400 // loss: 0.043\n", "epoch: 170, batch: 1500 // loss: 0.048\n", "epoch: 170, batch: 1600 // loss: 0.052\n", "epoch: 170, batch: 1700 // loss: 0.045\n", "epoch: 170, batch: 1800 // loss: 0.053\n", "epoch: 170, batch: 1900 // loss: 0.045\n", "epoch: 170, batch: 2000 // loss: 0.047\n", "epoch: 170, batch: 2100 // loss: 0.046\n", "epoch: 170, batch: 2200 // loss: 0.050\n", "epoch: 170, batch: 2300 // loss: 0.049\n", "epoch: 170, batch: 2400 // loss: 0.042\n", "epoch: 170, batch: 2500 // loss: 0.042\n", "epoch: 170, batch: 2600 // loss: 0.045\n", "epoch: 170, batch: 2700 // loss: 0.042\n", "epoch: 170, batch: 2800 // loss: 0.046\n", "epoch: 170, batch: 2900 // loss: 0.042\n", "epoch: 170, batch: 3000 // loss: 0.045\n", "epoch: 170, batch: 3100 // loss: 0.043\n", "epoch: 170, batch: 3200 // loss: 0.039\n", "epoch: 170, batch: 3300 // loss: 0.038\n", "epoch: 170, batch: 3400 // loss: 0.044\n", "epoch: 170, batch: 3500 // loss: 0.035\n", "epoch: 170, batch: 3600 // loss: 0.043\n", "epoch: 170, batch: 3700 // loss: 0.043\n", "\n", "epoch: 171, batch: 0 // loss: 0.053\n", "epoch: 171, batch: 100 // loss: 0.046\n", "epoch: 171, batch: 200 // loss: 0.043\n", "epoch: 171, batch: 300 // loss: 0.049\n", "epoch: 171, batch: 400 // loss: 0.046\n", "epoch: 171, batch: 500 // loss: 0.040\n", "epoch: 171, batch: 600 // loss: 0.040\n", "epoch: 171, batch: 700 // loss: 0.044\n", "epoch: 171, batch: 800 // loss: 0.042\n", "epoch: 171, batch: 900 // loss: 0.049\n", "epoch: 171, batch: 1000 // loss: 0.046\n", "epoch: 171, batch: 1100 // loss: 0.042\n", "epoch: 171, batch: 1200 // loss: 0.044\n", "epoch: 171, batch: 1300 // loss: 0.046\n", "epoch: 171, batch: 1400 // loss: 0.043\n", "epoch: 171, batch: 1500 // loss: 0.048\n", "epoch: 171, batch: 1600 // loss: 0.052\n", "epoch: 171, batch: 1700 // loss: 0.045\n", "epoch: 171, batch: 1800 // loss: 0.053\n", "epoch: 171, batch: 1900 // loss: 0.045\n", "epoch: 171, batch: 2000 // loss: 0.047\n", "epoch: 171, batch: 2100 // loss: 0.046\n", "epoch: 171, batch: 2200 // loss: 0.050\n", "epoch: 171, batch: 2300 // loss: 0.049\n", "epoch: 171, batch: 2400 // loss: 0.042\n", "epoch: 171, batch: 2500 // loss: 0.042\n", "epoch: 171, batch: 2600 // loss: 0.045\n", "epoch: 171, batch: 2700 // loss: 0.042\n", "epoch: 171, batch: 2800 // loss: 0.046\n", "epoch: 171, batch: 2900 // loss: 0.042\n", "epoch: 171, batch: 3000 // loss: 0.045\n", "epoch: 171, batch: 3100 // loss: 0.043\n", "epoch: 171, batch: 3200 // loss: 0.039\n", "epoch: 171, batch: 3300 // loss: 0.038\n", "epoch: 171, batch: 3400 // loss: 0.044\n", "epoch: 171, batch: 3500 // loss: 0.035\n", "epoch: 171, batch: 3600 // loss: 0.043\n", "epoch: 171, batch: 3700 // loss: 0.043\n", "\n", "epoch: 172, batch: 0 // loss: 0.053\n", "epoch: 172, batch: 100 // loss: 0.046\n", "epoch: 172, batch: 200 // loss: 0.043\n", "epoch: 172, batch: 300 // loss: 0.049\n", "epoch: 172, batch: 400 // loss: 0.046\n", "epoch: 172, batch: 500 // loss: 0.040\n", "epoch: 172, batch: 600 // loss: 0.040\n", "epoch: 172, batch: 700 // loss: 0.044\n", "epoch: 172, batch: 800 // loss: 0.042\n", "epoch: 172, batch: 900 // loss: 0.049\n", "epoch: 172, batch: 1000 // loss: 0.046\n", "epoch: 172, batch: 1100 // loss: 0.042\n", "epoch: 172, batch: 1200 // loss: 0.044\n", "epoch: 172, batch: 1300 // loss: 0.046\n", "epoch: 172, batch: 1400 // loss: 0.043\n", "epoch: 172, batch: 1500 // loss: 0.048\n", "epoch: 172, batch: 1600 // loss: 0.052\n", "epoch: 172, batch: 1700 // loss: 0.045\n", "epoch: 172, batch: 1800 // loss: 0.053\n", "epoch: 172, batch: 1900 // loss: 0.045\n", "epoch: 172, batch: 2000 // loss: 0.047\n", "epoch: 172, batch: 2100 // loss: 0.046\n", "epoch: 172, batch: 2200 // loss: 0.050\n", "epoch: 172, batch: 2300 // loss: 0.049\n", "epoch: 172, batch: 2400 // loss: 0.042\n", "epoch: 172, batch: 2500 // loss: 0.042\n", "epoch: 172, batch: 2600 // loss: 0.045\n", "epoch: 172, batch: 2700 // loss: 0.042\n", "epoch: 172, batch: 2800 // loss: 0.046\n", "epoch: 172, batch: 2900 // loss: 0.042\n", "epoch: 172, batch: 3000 // loss: 0.045\n", "epoch: 172, batch: 3100 // loss: 0.043\n", "epoch: 172, batch: 3200 // loss: 0.039\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 172, batch: 3300 // loss: 0.038\n", "epoch: 172, batch: 3400 // loss: 0.044\n", "epoch: 172, batch: 3500 // loss: 0.035\n", "epoch: 172, batch: 3600 // loss: 0.043\n", "epoch: 172, batch: 3700 // loss: 0.043\n", "\n", "epoch: 173, batch: 0 // loss: 0.053\n", "epoch: 173, batch: 100 // loss: 0.046\n", "epoch: 173, batch: 200 // loss: 0.043\n", "epoch: 173, batch: 300 // loss: 0.049\n", "epoch: 173, batch: 400 // loss: 0.046\n", "epoch: 173, batch: 500 // loss: 0.040\n", "epoch: 173, batch: 600 // loss: 0.040\n", "epoch: 173, batch: 700 // loss: 0.044\n", "epoch: 173, batch: 800 // loss: 0.042\n", "epoch: 173, batch: 900 // loss: 0.049\n", "epoch: 173, batch: 1000 // loss: 0.046\n", "epoch: 173, batch: 1100 // loss: 0.042\n", "epoch: 173, batch: 1200 // loss: 0.044\n", "epoch: 173, batch: 1300 // loss: 0.046\n", "epoch: 173, batch: 1400 // loss: 0.043\n", "epoch: 173, batch: 1500 // loss: 0.048\n", "epoch: 173, batch: 1600 // loss: 0.052\n", "epoch: 173, batch: 1700 // loss: 0.045\n", "epoch: 173, batch: 1800 // loss: 0.053\n", "epoch: 173, batch: 1900 // loss: 0.045\n", "epoch: 173, batch: 2000 // loss: 0.047\n", "epoch: 173, batch: 2100 // loss: 0.046\n", "epoch: 173, batch: 2200 // loss: 0.050\n", "epoch: 173, batch: 2300 // loss: 0.049\n", "epoch: 173, batch: 2400 // loss: 0.042\n", "epoch: 173, batch: 2500 // loss: 0.042\n", "epoch: 173, batch: 2600 // loss: 0.045\n", "epoch: 173, batch: 2700 // loss: 0.042\n", "epoch: 173, batch: 2800 // loss: 0.046\n", "epoch: 173, batch: 2900 // loss: 0.042\n", "epoch: 173, batch: 3000 // loss: 0.045\n", "epoch: 173, batch: 3100 // loss: 0.043\n", "epoch: 173, batch: 3200 // loss: 0.039\n", "epoch: 173, batch: 3300 // loss: 0.038\n", "epoch: 173, batch: 3400 // loss: 0.044\n", "epoch: 173, batch: 3500 // loss: 0.035\n", "epoch: 173, batch: 3600 // loss: 0.043\n", "epoch: 173, batch: 3700 // loss: 0.043\n", "\n", "epoch: 174, batch: 0 // loss: 0.053\n", "epoch: 174, batch: 100 // loss: 0.046\n", "epoch: 174, batch: 200 // loss: 0.043\n", "epoch: 174, batch: 300 // loss: 0.049\n", "epoch: 174, batch: 400 // loss: 0.046\n", "epoch: 174, batch: 500 // loss: 0.040\n", "epoch: 174, batch: 600 // loss: 0.040\n", "epoch: 174, batch: 700 // loss: 0.044\n", "epoch: 174, batch: 800 // loss: 0.042\n", "epoch: 174, batch: 900 // loss: 0.049\n", "epoch: 174, batch: 1000 // loss: 0.046\n", "epoch: 174, batch: 1100 // loss: 0.042\n", "epoch: 174, batch: 1200 // loss: 0.044\n", "epoch: 174, batch: 1300 // loss: 0.046\n", "epoch: 174, batch: 1400 // loss: 0.043\n", "epoch: 174, batch: 1500 // loss: 0.048\n", "epoch: 174, batch: 1600 // loss: 0.052\n", "epoch: 174, batch: 1700 // loss: 0.045\n", "epoch: 174, batch: 1800 // loss: 0.053\n", "epoch: 174, batch: 1900 // loss: 0.045\n", "epoch: 174, batch: 2000 // loss: 0.047\n", "epoch: 174, batch: 2100 // loss: 0.046\n", "epoch: 174, batch: 2200 // loss: 0.050\n", "epoch: 174, batch: 2300 // loss: 0.049\n", "epoch: 174, batch: 2400 // loss: 0.042\n", "epoch: 174, batch: 2500 // loss: 0.042\n", "epoch: 174, batch: 2600 // loss: 0.045\n", "epoch: 174, batch: 2700 // loss: 0.042\n", "epoch: 174, batch: 2800 // loss: 0.046\n", "epoch: 174, batch: 2900 // loss: 0.042\n", "epoch: 174, batch: 3000 // loss: 0.045\n", "epoch: 174, batch: 3100 // loss: 0.043\n", "epoch: 174, batch: 3200 // loss: 0.039\n", "epoch: 174, batch: 3300 // loss: 0.038\n", "epoch: 174, batch: 3400 // loss: 0.044\n", "epoch: 174, batch: 3500 // loss: 0.035\n", "epoch: 174, batch: 3600 // loss: 0.043\n", "epoch: 174, batch: 3700 // loss: 0.043\n", "\n", "epoch: 175, batch: 0 // loss: 0.053\n", "epoch: 175, batch: 100 // loss: 0.046\n", "epoch: 175, batch: 200 // loss: 0.043\n", "epoch: 175, batch: 300 // loss: 0.049\n", "epoch: 175, batch: 400 // loss: 0.046\n", "epoch: 175, batch: 500 // loss: 0.040\n", "epoch: 175, batch: 600 // loss: 0.040\n", "epoch: 175, batch: 700 // loss: 0.044\n", "epoch: 175, batch: 800 // loss: 0.042\n", "epoch: 175, batch: 900 // loss: 0.049\n", "epoch: 175, batch: 1000 // loss: 0.046\n", "epoch: 175, batch: 1100 // loss: 0.042\n", "epoch: 175, batch: 1200 // loss: 0.044\n", "epoch: 175, batch: 1300 // loss: 0.046\n", "epoch: 175, batch: 1400 // loss: 0.043\n", "epoch: 175, batch: 1500 // loss: 0.048\n", "epoch: 175, batch: 1600 // loss: 0.052\n", "epoch: 175, batch: 1700 // loss: 0.045\n", "epoch: 175, batch: 1800 // loss: 0.053\n", "epoch: 175, batch: 1900 // loss: 0.045\n", "epoch: 175, batch: 2000 // loss: 0.047\n", "epoch: 175, batch: 2100 // loss: 0.046\n", "epoch: 175, batch: 2200 // loss: 0.050\n", "epoch: 175, batch: 2300 // loss: 0.049\n", "epoch: 175, batch: 2400 // loss: 0.042\n", "epoch: 175, batch: 2500 // loss: 0.042\n", "epoch: 175, batch: 2600 // loss: 0.045\n", "epoch: 175, batch: 2700 // loss: 0.042\n", "epoch: 175, batch: 2800 // loss: 0.046\n", "epoch: 175, batch: 2900 // loss: 0.042\n", "epoch: 175, batch: 3000 // loss: 0.045\n", "epoch: 175, batch: 3100 // loss: 0.043\n", "epoch: 175, batch: 3200 // loss: 0.039\n", "epoch: 175, batch: 3300 // loss: 0.038\n", "epoch: 175, batch: 3400 // loss: 0.044\n", "epoch: 175, batch: 3500 // loss: 0.035\n", "epoch: 175, batch: 3600 // loss: 0.043\n", "epoch: 175, batch: 3700 // loss: 0.043\n", "\n", "epoch: 176, batch: 0 // loss: 0.053\n", "epoch: 176, batch: 100 // loss: 0.046\n", "epoch: 176, batch: 200 // loss: 0.043\n", "epoch: 176, batch: 300 // loss: 0.049\n", "epoch: 176, batch: 400 // loss: 0.046\n", "epoch: 176, batch: 500 // loss: 0.040\n", "epoch: 176, batch: 600 // loss: 0.040\n", "epoch: 176, batch: 700 // loss: 0.044\n", "epoch: 176, batch: 800 // loss: 0.042\n", "epoch: 176, batch: 900 // loss: 0.049\n", "epoch: 176, batch: 1000 // loss: 0.046\n", "epoch: 176, batch: 1100 // loss: 0.042\n", "epoch: 176, batch: 1200 // loss: 0.044\n", "epoch: 176, batch: 1300 // loss: 0.046\n", "epoch: 176, batch: 1400 // loss: 0.043\n", "epoch: 176, batch: 1500 // loss: 0.048\n", "epoch: 176, batch: 1600 // loss: 0.052\n", "epoch: 176, batch: 1700 // loss: 0.045\n", "epoch: 176, batch: 1800 // loss: 0.053\n", "epoch: 176, batch: 1900 // loss: 0.045\n", "epoch: 176, batch: 2000 // loss: 0.047\n", "epoch: 176, batch: 2100 // loss: 0.046\n", "epoch: 176, batch: 2200 // loss: 0.050\n", "epoch: 176, batch: 2300 // loss: 0.049\n", "epoch: 176, batch: 2400 // loss: 0.042\n", "epoch: 176, batch: 2500 // loss: 0.042\n", "epoch: 176, batch: 2600 // loss: 0.045\n", "epoch: 176, batch: 2700 // loss: 0.042\n", "epoch: 176, batch: 2800 // loss: 0.046\n", "epoch: 176, batch: 2900 // loss: 0.042\n", "epoch: 176, batch: 3000 // loss: 0.045\n", "epoch: 176, batch: 3100 // loss: 0.043\n", "epoch: 176, batch: 3200 // loss: 0.039\n", "epoch: 176, batch: 3300 // loss: 0.038\n", "epoch: 176, batch: 3400 // loss: 0.044\n", "epoch: 176, batch: 3500 // loss: 0.035\n", "epoch: 176, batch: 3600 // loss: 0.043\n", "epoch: 176, batch: 3700 // loss: 0.043\n", "\n", "epoch: 177, batch: 0 // loss: 0.053\n", "epoch: 177, batch: 100 // loss: 0.046\n", "epoch: 177, batch: 200 // loss: 0.043\n", "epoch: 177, batch: 300 // loss: 0.049\n", "epoch: 177, batch: 400 // loss: 0.046\n", "epoch: 177, batch: 500 // loss: 0.040\n", "epoch: 177, batch: 600 // loss: 0.040\n", "epoch: 177, batch: 700 // loss: 0.044\n", "epoch: 177, batch: 800 // loss: 0.042\n", "epoch: 177, batch: 900 // loss: 0.049\n", "epoch: 177, batch: 1000 // loss: 0.046\n", "epoch: 177, batch: 1100 // loss: 0.042\n", "epoch: 177, batch: 1200 // loss: 0.044\n", "epoch: 177, batch: 1300 // loss: 0.046\n", "epoch: 177, batch: 1400 // loss: 0.043\n", "epoch: 177, batch: 1500 // loss: 0.048\n", "epoch: 177, batch: 1600 // loss: 0.052\n", "epoch: 177, batch: 1700 // loss: 0.045\n", "epoch: 177, batch: 1800 // loss: 0.053\n", "epoch: 177, batch: 1900 // loss: 0.045\n", "epoch: 177, batch: 2000 // loss: 0.047\n", "epoch: 177, batch: 2100 // loss: 0.046\n", "epoch: 177, batch: 2200 // loss: 0.050\n", "epoch: 177, batch: 2300 // loss: 0.049\n", "epoch: 177, batch: 2400 // loss: 0.042\n", "epoch: 177, batch: 2500 // loss: 0.042\n", "epoch: 177, batch: 2600 // loss: 0.045\n", "epoch: 177, batch: 2700 // loss: 0.042\n", "epoch: 177, batch: 2800 // loss: 0.046\n", "epoch: 177, batch: 2900 // loss: 0.042\n", "epoch: 177, batch: 3000 // loss: 0.045\n", "epoch: 177, batch: 3100 // loss: 0.043\n", "epoch: 177, batch: 3200 // loss: 0.039\n", "epoch: 177, batch: 3300 // loss: 0.038\n", "epoch: 177, batch: 3400 // loss: 0.044\n", "epoch: 177, batch: 3500 // loss: 0.035\n", "epoch: 177, batch: 3600 // loss: 0.043\n", "epoch: 177, batch: 3700 // loss: 0.043\n", "\n", "epoch: 178, batch: 0 // loss: 0.053\n", "epoch: 178, batch: 100 // loss: 0.046\n", "epoch: 178, batch: 200 // loss: 0.043\n", "epoch: 178, batch: 300 // loss: 0.049\n", "epoch: 178, batch: 400 // loss: 0.046\n", "epoch: 178, batch: 500 // loss: 0.040\n", "epoch: 178, batch: 600 // loss: 0.040\n", "epoch: 178, batch: 700 // loss: 0.044\n", "epoch: 178, batch: 800 // loss: 0.042\n", "epoch: 178, batch: 900 // loss: 0.049\n", "epoch: 178, batch: 1000 // loss: 0.046\n", "epoch: 178, batch: 1100 // loss: 0.042\n", "epoch: 178, batch: 1200 // loss: 0.044\n", "epoch: 178, batch: 1300 // loss: 0.046\n", "epoch: 178, batch: 1400 // loss: 0.043\n", "epoch: 178, batch: 1500 // loss: 0.048\n", "epoch: 178, batch: 1600 // loss: 0.052\n", "epoch: 178, batch: 1700 // loss: 0.045\n", "epoch: 178, batch: 1800 // loss: 0.053\n", "epoch: 178, batch: 1900 // loss: 0.045\n", "epoch: 178, batch: 2000 // loss: 0.047\n", "epoch: 178, batch: 2100 // loss: 0.046\n", "epoch: 178, batch: 2200 // loss: 0.050\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 178, batch: 2300 // loss: 0.049\n", "epoch: 178, batch: 2400 // loss: 0.042\n", "epoch: 178, batch: 2500 // loss: 0.042\n", "epoch: 178, batch: 2600 // loss: 0.045\n", "epoch: 178, batch: 2700 // loss: 0.042\n", "epoch: 178, batch: 2800 // loss: 0.046\n", "epoch: 178, batch: 2900 // loss: 0.042\n", "epoch: 178, batch: 3000 // loss: 0.045\n", "epoch: 178, batch: 3100 // loss: 0.043\n", "epoch: 178, batch: 3200 // loss: 0.039\n", "epoch: 178, batch: 3300 // loss: 0.038\n", "epoch: 178, batch: 3400 // loss: 0.044\n", "epoch: 178, batch: 3500 // loss: 0.035\n", "epoch: 178, batch: 3600 // loss: 0.043\n", "epoch: 178, batch: 3700 // loss: 0.043\n", "\n", "epoch: 179, batch: 0 // loss: 0.053\n", "epoch: 179, batch: 100 // loss: 0.046\n", "epoch: 179, batch: 200 // loss: 0.043\n", "epoch: 179, batch: 300 // loss: 0.049\n", "epoch: 179, batch: 400 // loss: 0.046\n", "epoch: 179, batch: 500 // loss: 0.040\n", "epoch: 179, batch: 600 // loss: 0.040\n", "epoch: 179, batch: 700 // loss: 0.044\n", "epoch: 179, batch: 800 // loss: 0.042\n", "epoch: 179, batch: 900 // loss: 0.049\n", "epoch: 179, batch: 1000 // loss: 0.046\n", "epoch: 179, batch: 1100 // loss: 0.042\n", "epoch: 179, batch: 1200 // loss: 0.044\n", "epoch: 179, batch: 1300 // loss: 0.046\n", "epoch: 179, batch: 1400 // loss: 0.043\n", "epoch: 179, batch: 1500 // loss: 0.048\n", "epoch: 179, batch: 1600 // loss: 0.052\n", "epoch: 179, batch: 1700 // loss: 0.045\n", "epoch: 179, batch: 1800 // loss: 0.053\n", "epoch: 179, batch: 1900 // loss: 0.045\n", "epoch: 179, batch: 2000 // loss: 0.047\n", "epoch: 179, batch: 2100 // loss: 0.046\n", "epoch: 179, batch: 2200 // loss: 0.050\n", "epoch: 179, batch: 2300 // loss: 0.049\n", "epoch: 179, batch: 2400 // loss: 0.042\n", "epoch: 179, batch: 2500 // loss: 0.042\n", "epoch: 179, batch: 2600 // loss: 0.045\n", "epoch: 179, batch: 2700 // loss: 0.042\n", "epoch: 179, batch: 2800 // loss: 0.046\n", "epoch: 179, batch: 2900 // loss: 0.042\n", "epoch: 179, batch: 3000 // loss: 0.045\n", "epoch: 179, batch: 3100 // loss: 0.043\n", "epoch: 179, batch: 3200 // loss: 0.039\n", "epoch: 179, batch: 3300 // loss: 0.038\n", "epoch: 179, batch: 3400 // loss: 0.044\n", "epoch: 179, batch: 3500 // loss: 0.035\n", "epoch: 179, batch: 3600 // loss: 0.043\n", "epoch: 179, batch: 3700 // loss: 0.043\n", "\n", "epoch: 180, batch: 0 // loss: 0.053\n", "epoch: 180, batch: 100 // loss: 0.046\n", "epoch: 180, batch: 200 // loss: 0.043\n", "epoch: 180, batch: 300 // loss: 0.049\n", "epoch: 180, batch: 400 // loss: 0.046\n", "epoch: 180, batch: 500 // loss: 0.040\n", "epoch: 180, batch: 600 // loss: 0.040\n", "epoch: 180, batch: 700 // loss: 0.044\n", "epoch: 180, batch: 800 // loss: 0.042\n", "epoch: 180, batch: 900 // loss: 0.049\n", "epoch: 180, batch: 1000 // loss: 0.046\n", "epoch: 180, batch: 1100 // loss: 0.042\n", "epoch: 180, batch: 1200 // loss: 0.044\n", "epoch: 180, batch: 1300 // loss: 0.046\n", "epoch: 180, batch: 1400 // loss: 0.043\n", "epoch: 180, batch: 1500 // loss: 0.048\n", "epoch: 180, batch: 1600 // loss: 0.052\n", "epoch: 180, batch: 1700 // loss: 0.045\n", "epoch: 180, batch: 1800 // loss: 0.053\n", "epoch: 180, batch: 1900 // loss: 0.045\n", "epoch: 180, batch: 2000 // loss: 0.047\n", "epoch: 180, batch: 2100 // loss: 0.046\n", "epoch: 180, batch: 2200 // loss: 0.050\n", "epoch: 180, batch: 2300 // loss: 0.049\n", "epoch: 180, batch: 2400 // loss: 0.042\n", "epoch: 180, batch: 2500 // loss: 0.042\n", "epoch: 180, batch: 2600 // loss: 0.045\n", "epoch: 180, batch: 2700 // loss: 0.042\n", "epoch: 180, batch: 2800 // loss: 0.046\n", "epoch: 180, batch: 2900 // loss: 0.042\n", "epoch: 180, batch: 3000 // loss: 0.045\n", "epoch: 180, batch: 3100 // loss: 0.043\n", "epoch: 180, batch: 3200 // loss: 0.039\n", "epoch: 180, batch: 3300 // loss: 0.038\n", "epoch: 180, batch: 3400 // loss: 0.044\n", "epoch: 180, batch: 3500 // loss: 0.035\n", "epoch: 180, batch: 3600 // loss: 0.043\n", "epoch: 180, batch: 3700 // loss: 0.043\n", "\n", "epoch: 181, batch: 0 // loss: 0.053\n", "epoch: 181, batch: 100 // loss: 0.046\n", "epoch: 181, batch: 200 // loss: 0.043\n", "epoch: 181, batch: 300 // loss: 0.049\n", "epoch: 181, batch: 400 // loss: 0.046\n", "epoch: 181, batch: 500 // loss: 0.040\n", "epoch: 181, batch: 600 // loss: 0.040\n", "epoch: 181, batch: 700 // loss: 0.044\n", "epoch: 181, batch: 800 // loss: 0.042\n", "epoch: 181, batch: 900 // loss: 0.049\n", "epoch: 181, batch: 1000 // loss: 0.046\n", "epoch: 181, batch: 1100 // loss: 0.042\n", "epoch: 181, batch: 1200 // loss: 0.044\n", "epoch: 181, batch: 1300 // loss: 0.046\n", "epoch: 181, batch: 1400 // loss: 0.043\n", "epoch: 181, batch: 1500 // loss: 0.048\n", "epoch: 181, batch: 1600 // loss: 0.052\n", "epoch: 181, batch: 1700 // loss: 0.045\n", "epoch: 181, batch: 1800 // loss: 0.053\n", "epoch: 181, batch: 1900 // loss: 0.045\n", "epoch: 181, batch: 2000 // loss: 0.047\n", "epoch: 181, batch: 2100 // loss: 0.046\n", "epoch: 181, batch: 2200 // loss: 0.050\n", "epoch: 181, batch: 2300 // loss: 0.049\n", "epoch: 181, batch: 2400 // loss: 0.042\n", "epoch: 181, batch: 2500 // loss: 0.042\n", "epoch: 181, batch: 2600 // loss: 0.045\n", "epoch: 181, batch: 2700 // loss: 0.042\n", "epoch: 181, batch: 2800 // loss: 0.046\n", "epoch: 181, batch: 2900 // loss: 0.042\n", "epoch: 181, batch: 3000 // loss: 0.045\n", "epoch: 181, batch: 3100 // loss: 0.043\n", "epoch: 181, batch: 3200 // loss: 0.039\n", "epoch: 181, batch: 3300 // loss: 0.038\n", "epoch: 181, batch: 3400 // loss: 0.044\n", "epoch: 181, batch: 3500 // loss: 0.035\n", "epoch: 181, batch: 3600 // loss: 0.043\n", "epoch: 181, batch: 3700 // loss: 0.043\n", "\n", "epoch: 182, batch: 0 // loss: 0.053\n", "epoch: 182, batch: 100 // loss: 0.046\n", "epoch: 182, batch: 200 // loss: 0.043\n", "epoch: 182, batch: 300 // loss: 0.049\n", "epoch: 182, batch: 400 // loss: 0.046\n", "epoch: 182, batch: 500 // loss: 0.040\n", "epoch: 182, batch: 600 // loss: 0.040\n", "epoch: 182, batch: 700 // loss: 0.044\n", "epoch: 182, batch: 800 // loss: 0.042\n", "epoch: 182, batch: 900 // loss: 0.049\n", "epoch: 182, batch: 1000 // loss: 0.046\n", "epoch: 182, batch: 1100 // loss: 0.042\n", "epoch: 182, batch: 1200 // loss: 0.044\n", "epoch: 182, batch: 1300 // loss: 0.046\n", "epoch: 182, batch: 1400 // loss: 0.043\n", "epoch: 182, batch: 1500 // loss: 0.048\n", "epoch: 182, batch: 1600 // loss: 0.052\n", "epoch: 182, batch: 1700 // loss: 0.045\n", "epoch: 182, batch: 1800 // loss: 0.053\n", "epoch: 182, batch: 1900 // loss: 0.045\n", "epoch: 182, batch: 2000 // loss: 0.047\n", "epoch: 182, batch: 2100 // loss: 0.046\n", "epoch: 182, batch: 2200 // loss: 0.050\n", "epoch: 182, batch: 2300 // loss: 0.049\n", "epoch: 182, batch: 2400 // loss: 0.042\n", "epoch: 182, batch: 2500 // loss: 0.042\n", "epoch: 182, batch: 2600 // loss: 0.045\n", "epoch: 182, batch: 2700 // loss: 0.042\n", "epoch: 182, batch: 2800 // loss: 0.046\n", "epoch: 182, batch: 2900 // loss: 0.042\n", "epoch: 182, batch: 3000 // loss: 0.045\n", "epoch: 182, batch: 3100 // loss: 0.043\n", "epoch: 182, batch: 3200 // loss: 0.039\n", "epoch: 182, batch: 3300 // loss: 0.038\n", "epoch: 182, batch: 3400 // loss: 0.044\n", "epoch: 182, batch: 3500 // loss: 0.035\n", "epoch: 182, batch: 3600 // loss: 0.043\n", "epoch: 182, batch: 3700 // loss: 0.043\n", "\n", "epoch: 183, batch: 0 // loss: 0.053\n", "epoch: 183, batch: 100 // loss: 0.046\n", "epoch: 183, batch: 200 // loss: 0.043\n", "epoch: 183, batch: 300 // loss: 0.049\n", "epoch: 183, batch: 400 // loss: 0.046\n", "epoch: 183, batch: 500 // loss: 0.040\n", "epoch: 183, batch: 600 // loss: 0.040\n", "epoch: 183, batch: 700 // loss: 0.044\n", "epoch: 183, batch: 800 // loss: 0.042\n", "epoch: 183, batch: 900 // loss: 0.049\n", "epoch: 183, batch: 1000 // loss: 0.046\n", "epoch: 183, batch: 1100 // loss: 0.042\n", "epoch: 183, batch: 1200 // loss: 0.044\n", "epoch: 183, batch: 1300 // loss: 0.046\n", "epoch: 183, batch: 1400 // loss: 0.043\n", "epoch: 183, batch: 1500 // loss: 0.048\n", "epoch: 183, batch: 1600 // loss: 0.052\n", "epoch: 183, batch: 1700 // loss: 0.045\n", "epoch: 183, batch: 1800 // loss: 0.053\n", "epoch: 183, batch: 1900 // loss: 0.045\n", "epoch: 183, batch: 2000 // loss: 0.047\n", "epoch: 183, batch: 2100 // loss: 0.046\n", "epoch: 183, batch: 2200 // loss: 0.050\n", "epoch: 183, batch: 2300 // loss: 0.049\n", "epoch: 183, batch: 2400 // loss: 0.042\n", "epoch: 183, batch: 2500 // loss: 0.042\n", "epoch: 183, batch: 2600 // loss: 0.045\n", "epoch: 183, batch: 2700 // loss: 0.042\n", "epoch: 183, batch: 2800 // loss: 0.046\n", "epoch: 183, batch: 2900 // loss: 0.042\n", "epoch: 183, batch: 3000 // loss: 0.045\n", "epoch: 183, batch: 3100 // loss: 0.043\n", "epoch: 183, batch: 3200 // loss: 0.039\n", "epoch: 183, batch: 3300 // loss: 0.038\n", "epoch: 183, batch: 3400 // loss: 0.044\n", "epoch: 183, batch: 3500 // loss: 0.035\n", "epoch: 183, batch: 3600 // loss: 0.043\n", "epoch: 183, batch: 3700 // loss: 0.043\n", "\n", "epoch: 184, batch: 0 // loss: 0.053\n", "epoch: 184, batch: 100 // loss: 0.046\n", "epoch: 184, batch: 200 // loss: 0.043\n", "epoch: 184, batch: 300 // loss: 0.049\n", "epoch: 184, batch: 400 // loss: 0.046\n", "epoch: 184, batch: 500 // loss: 0.040\n", "epoch: 184, batch: 600 // loss: 0.040\n", "epoch: 184, batch: 700 // loss: 0.044\n", "epoch: 184, batch: 800 // loss: 0.042\n", "epoch: 184, batch: 900 // loss: 0.049\n", "epoch: 184, batch: 1000 // loss: 0.046\n", "epoch: 184, batch: 1100 // loss: 0.042\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 184, batch: 1200 // loss: 0.044\n", "epoch: 184, batch: 1300 // loss: 0.046\n", "epoch: 184, batch: 1400 // loss: 0.043\n", "epoch: 184, batch: 1500 // loss: 0.048\n", "epoch: 184, batch: 1600 // loss: 0.052\n", "epoch: 184, batch: 1700 // loss: 0.045\n", "epoch: 184, batch: 1800 // loss: 0.053\n", "epoch: 184, batch: 1900 // loss: 0.045\n", "epoch: 184, batch: 2000 // loss: 0.047\n", "epoch: 184, batch: 2100 // loss: 0.046\n", "epoch: 184, batch: 2200 // loss: 0.050\n", "epoch: 184, batch: 2300 // loss: 0.049\n", "epoch: 184, batch: 2400 // loss: 0.042\n", "epoch: 184, batch: 2500 // loss: 0.042\n", "epoch: 184, batch: 2600 // loss: 0.045\n", "epoch: 184, batch: 2700 // loss: 0.042\n", "epoch: 184, batch: 2800 // loss: 0.046\n", "epoch: 184, batch: 2900 // loss: 0.042\n", "epoch: 184, batch: 3000 // loss: 0.045\n", "epoch: 184, batch: 3100 // loss: 0.043\n", "epoch: 184, batch: 3200 // loss: 0.039\n", "epoch: 184, batch: 3300 // loss: 0.038\n", "epoch: 184, batch: 3400 // loss: 0.044\n", "epoch: 184, batch: 3500 // loss: 0.035\n", "epoch: 184, batch: 3600 // loss: 0.043\n", "epoch: 184, batch: 3700 // loss: 0.043\n", "\n", "epoch: 185, batch: 0 // loss: 0.053\n", "epoch: 185, batch: 100 // loss: 0.046\n", "epoch: 185, batch: 200 // loss: 0.043\n", "epoch: 185, batch: 300 // loss: 0.049\n", "epoch: 185, batch: 400 // loss: 0.046\n", "epoch: 185, batch: 500 // loss: 0.040\n", "epoch: 185, batch: 600 // loss: 0.040\n", "epoch: 185, batch: 700 // loss: 0.044\n", "epoch: 185, batch: 800 // loss: 0.042\n", "epoch: 185, batch: 900 // loss: 0.049\n", "epoch: 185, batch: 1000 // loss: 0.046\n", "epoch: 185, batch: 1100 // loss: 0.042\n", "epoch: 185, batch: 1200 // loss: 0.044\n", "epoch: 185, batch: 1300 // loss: 0.046\n", "epoch: 185, batch: 1400 // loss: 0.043\n", "epoch: 185, batch: 1500 // loss: 0.048\n", "epoch: 185, batch: 1600 // loss: 0.052\n", "epoch: 185, batch: 1700 // loss: 0.045\n", "epoch: 185, batch: 1800 // loss: 0.053\n", "epoch: 185, batch: 1900 // loss: 0.045\n", "epoch: 185, batch: 2000 // loss: 0.047\n", "epoch: 185, batch: 2100 // loss: 0.046\n", "epoch: 185, batch: 2200 // loss: 0.050\n", "epoch: 185, batch: 2300 // loss: 0.049\n", "epoch: 185, batch: 2400 // loss: 0.042\n", "epoch: 185, batch: 2500 // loss: 0.042\n", "epoch: 185, batch: 2600 // loss: 0.045\n", "epoch: 185, batch: 2700 // loss: 0.042\n", "epoch: 185, batch: 2800 // loss: 0.046\n", "epoch: 185, batch: 2900 // loss: 0.042\n", "epoch: 185, batch: 3000 // loss: 0.045\n", "epoch: 185, batch: 3100 // loss: 0.043\n", "epoch: 185, batch: 3200 // loss: 0.039\n", "epoch: 185, batch: 3300 // loss: 0.038\n", "epoch: 185, batch: 3400 // loss: 0.044\n", "epoch: 185, batch: 3500 // loss: 0.035\n", "epoch: 185, batch: 3600 // loss: 0.043\n", "epoch: 185, batch: 3700 // loss: 0.043\n", "\n", "epoch: 186, batch: 0 // loss: 0.053\n", "epoch: 186, batch: 100 // loss: 0.046\n", "epoch: 186, batch: 200 // loss: 0.043\n", "epoch: 186, batch: 300 // loss: 0.049\n", "epoch: 186, batch: 400 // loss: 0.046\n", "epoch: 186, batch: 500 // loss: 0.040\n", "epoch: 186, batch: 600 // loss: 0.040\n", "epoch: 186, batch: 700 // loss: 0.044\n", "epoch: 186, batch: 800 // loss: 0.042\n", "epoch: 186, batch: 900 // loss: 0.049\n", "epoch: 186, batch: 1000 // loss: 0.046\n", "epoch: 186, batch: 1100 // loss: 0.042\n", "epoch: 186, batch: 1200 // loss: 0.044\n", "epoch: 186, batch: 1300 // loss: 0.046\n", "epoch: 186, batch: 1400 // loss: 0.043\n", "epoch: 186, batch: 1500 // loss: 0.048\n", "epoch: 186, batch: 1600 // loss: 0.052\n", "epoch: 186, batch: 1700 // loss: 0.045\n", "epoch: 186, batch: 1800 // loss: 0.053\n", "epoch: 186, batch: 1900 // loss: 0.045\n", "epoch: 186, batch: 2000 // loss: 0.047\n", "epoch: 186, batch: 2100 // loss: 0.046\n", "epoch: 186, batch: 2200 // loss: 0.050\n", "epoch: 186, batch: 2300 // loss: 0.049\n", "epoch: 186, batch: 2400 // loss: 0.042\n", "epoch: 186, batch: 2500 // loss: 0.042\n", "epoch: 186, batch: 2600 // loss: 0.045\n", "epoch: 186, batch: 2700 // loss: 0.042\n", "epoch: 186, batch: 2800 // loss: 0.046\n", "epoch: 186, batch: 2900 // loss: 0.042\n", "epoch: 186, batch: 3000 // loss: 0.045\n", "epoch: 186, batch: 3100 // loss: 0.043\n", "epoch: 186, batch: 3200 // loss: 0.039\n", "epoch: 186, batch: 3300 // loss: 0.038\n", "epoch: 186, batch: 3400 // loss: 0.044\n", "epoch: 186, batch: 3500 // loss: 0.035\n", "epoch: 186, batch: 3600 // loss: 0.043\n", "epoch: 186, batch: 3700 // loss: 0.043\n", "\n", "epoch: 187, batch: 0 // loss: 0.053\n", "epoch: 187, batch: 100 // loss: 0.046\n", "epoch: 187, batch: 200 // loss: 0.043\n", "epoch: 187, batch: 300 // loss: 0.049\n", "epoch: 187, batch: 400 // loss: 0.046\n", "epoch: 187, batch: 500 // loss: 0.040\n", "epoch: 187, batch: 600 // loss: 0.040\n", "epoch: 187, batch: 700 // loss: 0.044\n", "epoch: 187, batch: 800 // loss: 0.042\n", "epoch: 187, batch: 900 // loss: 0.049\n", "epoch: 187, batch: 1000 // loss: 0.046\n", "epoch: 187, batch: 1100 // loss: 0.042\n", "epoch: 187, batch: 1200 // loss: 0.044\n", "epoch: 187, batch: 1300 // loss: 0.046\n", "epoch: 187, batch: 1400 // loss: 0.043\n", "epoch: 187, batch: 1500 // loss: 0.048\n", "epoch: 187, batch: 1600 // loss: 0.052\n", "epoch: 187, batch: 1700 // loss: 0.045\n", "epoch: 187, batch: 1800 // loss: 0.053\n", "epoch: 187, batch: 1900 // loss: 0.045\n", "epoch: 187, batch: 2000 // loss: 0.047\n", "epoch: 187, batch: 2100 // loss: 0.046\n", "epoch: 187, batch: 2200 // loss: 0.050\n", "epoch: 187, batch: 2300 // loss: 0.049\n", "epoch: 187, batch: 2400 // loss: 0.042\n", "epoch: 187, batch: 2500 // loss: 0.042\n", "epoch: 187, batch: 2600 // loss: 0.045\n", "epoch: 187, batch: 2700 // loss: 0.042\n", "epoch: 187, batch: 2800 // loss: 0.046\n", "epoch: 187, batch: 2900 // loss: 0.042\n", "epoch: 187, batch: 3000 // loss: 0.045\n", "epoch: 187, batch: 3100 // loss: 0.043\n", "epoch: 187, batch: 3200 // loss: 0.039\n", "epoch: 187, batch: 3300 // loss: 0.038\n", "epoch: 187, batch: 3400 // loss: 0.044\n", "epoch: 187, batch: 3500 // loss: 0.035\n", "epoch: 187, batch: 3600 // loss: 0.043\n", "epoch: 187, batch: 3700 // loss: 0.043\n", "\n", "epoch: 188, batch: 0 // loss: 0.053\n", "epoch: 188, batch: 100 // loss: 0.046\n", "epoch: 188, batch: 200 // loss: 0.043\n", "epoch: 188, batch: 300 // loss: 0.049\n", "epoch: 188, batch: 400 // loss: 0.046\n", "epoch: 188, batch: 500 // loss: 0.040\n", "epoch: 188, batch: 600 // loss: 0.040\n", "epoch: 188, batch: 700 // loss: 0.044\n", "epoch: 188, batch: 800 // loss: 0.042\n", "epoch: 188, batch: 900 // loss: 0.049\n", "epoch: 188, batch: 1000 // loss: 0.046\n", "epoch: 188, batch: 1100 // loss: 0.042\n", "epoch: 188, batch: 1200 // loss: 0.044\n", "epoch: 188, batch: 1300 // loss: 0.046\n", "epoch: 188, batch: 1400 // loss: 0.043\n", "epoch: 188, batch: 1500 // loss: 0.048\n", "epoch: 188, batch: 1600 // loss: 0.052\n", "epoch: 188, batch: 1700 // loss: 0.045\n", "epoch: 188, batch: 1800 // loss: 0.053\n", "epoch: 188, batch: 1900 // loss: 0.045\n", "epoch: 188, batch: 2000 // loss: 0.047\n", "epoch: 188, batch: 2100 // loss: 0.046\n", "epoch: 188, batch: 2200 // loss: 0.050\n", "epoch: 188, batch: 2300 // loss: 0.049\n", "epoch: 188, batch: 2400 // loss: 0.042\n", "epoch: 188, batch: 2500 // loss: 0.042\n", "epoch: 188, batch: 2600 // loss: 0.045\n", "epoch: 188, batch: 2700 // loss: 0.042\n", "epoch: 188, batch: 2800 // loss: 0.046\n", "epoch: 188, batch: 2900 // loss: 0.042\n", "epoch: 188, batch: 3000 // loss: 0.045\n", "epoch: 188, batch: 3100 // loss: 0.043\n", "epoch: 188, batch: 3200 // loss: 0.039\n", "epoch: 188, batch: 3300 // loss: 0.038\n", "epoch: 188, batch: 3400 // loss: 0.044\n", "epoch: 188, batch: 3500 // loss: 0.035\n", "epoch: 188, batch: 3600 // loss: 0.043\n", "epoch: 188, batch: 3700 // loss: 0.043\n", "\n", "epoch: 189, batch: 0 // loss: 0.053\n", "epoch: 189, batch: 100 // loss: 0.046\n", "epoch: 189, batch: 200 // loss: 0.043\n", "epoch: 189, batch: 300 // loss: 0.049\n", "epoch: 189, batch: 400 // loss: 0.046\n", "epoch: 189, batch: 500 // loss: 0.040\n", "epoch: 189, batch: 600 // loss: 0.040\n", "epoch: 189, batch: 700 // loss: 0.044\n", "epoch: 189, batch: 800 // loss: 0.042\n", "epoch: 189, batch: 900 // loss: 0.049\n", "epoch: 189, batch: 1000 // loss: 0.046\n", "epoch: 189, batch: 1100 // loss: 0.042\n", "epoch: 189, batch: 1200 // loss: 0.044\n", "epoch: 189, batch: 1300 // loss: 0.046\n", "epoch: 189, batch: 1400 // loss: 0.043\n", "epoch: 189, batch: 1500 // loss: 0.048\n", "epoch: 189, batch: 1600 // loss: 0.052\n", "epoch: 189, batch: 1700 // loss: 0.045\n", "epoch: 189, batch: 1800 // loss: 0.053\n", "epoch: 189, batch: 1900 // loss: 0.045\n", "epoch: 189, batch: 2000 // loss: 0.047\n", "epoch: 189, batch: 2100 // loss: 0.046\n", "epoch: 189, batch: 2200 // loss: 0.050\n", "epoch: 189, batch: 2300 // loss: 0.049\n", "epoch: 189, batch: 2400 // loss: 0.042\n", "epoch: 189, batch: 2500 // loss: 0.042\n", "epoch: 189, batch: 2600 // loss: 0.045\n", "epoch: 189, batch: 2700 // loss: 0.042\n", "epoch: 189, batch: 2800 // loss: 0.046\n", "epoch: 189, batch: 2900 // loss: 0.042\n", "epoch: 189, batch: 3000 // loss: 0.045\n", "epoch: 189, batch: 3100 // loss: 0.043\n", "epoch: 189, batch: 3200 // loss: 0.039\n", "epoch: 189, batch: 3300 // loss: 0.038\n", "epoch: 189, batch: 3400 // loss: 0.044\n", "epoch: 189, batch: 3500 // loss: 0.035\n", "epoch: 189, batch: 3600 // loss: 0.043\n", "epoch: 189, batch: 3700 // loss: 0.043\n", "\n", "epoch: 190, batch: 0 // loss: 0.053\n", "epoch: 190, batch: 100 // loss: 0.046\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 190, batch: 200 // loss: 0.043\n", "epoch: 190, batch: 300 // loss: 0.049\n", "epoch: 190, batch: 400 // loss: 0.046\n", "epoch: 190, batch: 500 // loss: 0.040\n", "epoch: 190, batch: 600 // loss: 0.040\n", "epoch: 190, batch: 700 // loss: 0.044\n", "epoch: 190, batch: 800 // loss: 0.042\n", "epoch: 190, batch: 900 // loss: 0.049\n", "epoch: 190, batch: 1000 // loss: 0.046\n", "epoch: 190, batch: 1100 // loss: 0.042\n", "epoch: 190, batch: 1200 // loss: 0.044\n", "epoch: 190, batch: 1300 // loss: 0.046\n", "epoch: 190, batch: 1400 // loss: 0.043\n", "epoch: 190, batch: 1500 // loss: 0.048\n", "epoch: 190, batch: 1600 // loss: 0.052\n", "epoch: 190, batch: 1700 // loss: 0.045\n", "epoch: 190, batch: 1800 // loss: 0.053\n", "epoch: 190, batch: 1900 // loss: 0.045\n", "epoch: 190, batch: 2000 // loss: 0.047\n", "epoch: 190, batch: 2100 // loss: 0.046\n", "epoch: 190, batch: 2200 // loss: 0.050\n", "epoch: 190, batch: 2300 // loss: 0.049\n", "epoch: 190, batch: 2400 // loss: 0.042\n", "epoch: 190, batch: 2500 // loss: 0.042\n", "epoch: 190, batch: 2600 // loss: 0.045\n", "epoch: 190, batch: 2700 // loss: 0.042\n", "epoch: 190, batch: 2800 // loss: 0.046\n", "epoch: 190, batch: 2900 // loss: 0.042\n", "epoch: 190, batch: 3000 // loss: 0.045\n", "epoch: 190, batch: 3100 // loss: 0.043\n", "epoch: 190, batch: 3200 // loss: 0.039\n", "epoch: 190, batch: 3300 // loss: 0.038\n", "epoch: 190, batch: 3400 // loss: 0.044\n", "epoch: 190, batch: 3500 // loss: 0.035\n", "epoch: 190, batch: 3600 // loss: 0.043\n", "epoch: 190, batch: 3700 // loss: 0.043\n", "\n", "epoch: 191, batch: 0 // loss: 0.053\n", "epoch: 191, batch: 100 // loss: 0.046\n", "epoch: 191, batch: 200 // loss: 0.043\n", "epoch: 191, batch: 300 // loss: 0.049\n", "epoch: 191, batch: 400 // loss: 0.046\n", "epoch: 191, batch: 500 // loss: 0.040\n", "epoch: 191, batch: 600 // loss: 0.040\n", "epoch: 191, batch: 700 // loss: 0.044\n", "epoch: 191, batch: 800 // loss: 0.042\n", "epoch: 191, batch: 900 // loss: 0.049\n", "epoch: 191, batch: 1000 // loss: 0.046\n", "epoch: 191, batch: 1100 // loss: 0.042\n", "epoch: 191, batch: 1200 // loss: 0.044\n", "epoch: 191, batch: 1300 // loss: 0.046\n", "epoch: 191, batch: 1400 // loss: 0.043\n", "epoch: 191, batch: 1500 // loss: 0.048\n", "epoch: 191, batch: 1600 // loss: 0.052\n", "epoch: 191, batch: 1700 // loss: 0.045\n", "epoch: 191, batch: 1800 // loss: 0.053\n", "epoch: 191, batch: 1900 // loss: 0.045\n", "epoch: 191, batch: 2000 // loss: 0.047\n", "epoch: 191, batch: 2100 // loss: 0.046\n", "epoch: 191, batch: 2200 // loss: 0.050\n", "epoch: 191, batch: 2300 // loss: 0.049\n", "epoch: 191, batch: 2400 // loss: 0.042\n", "epoch: 191, batch: 2500 // loss: 0.042\n", "epoch: 191, batch: 2600 // loss: 0.045\n", "epoch: 191, batch: 2700 // loss: 0.042\n", "epoch: 191, batch: 2800 // loss: 0.046\n", "epoch: 191, batch: 2900 // loss: 0.042\n", "epoch: 191, batch: 3000 // loss: 0.045\n", "epoch: 191, batch: 3100 // loss: 0.043\n", "epoch: 191, batch: 3200 // loss: 0.039\n", "epoch: 191, batch: 3300 // loss: 0.038\n", "epoch: 191, batch: 3400 // loss: 0.044\n", "epoch: 191, batch: 3500 // loss: 0.035\n", "epoch: 191, batch: 3600 // loss: 0.043\n", "epoch: 191, batch: 3700 // loss: 0.043\n", "\n", "epoch: 192, batch: 0 // loss: 0.053\n", "epoch: 192, batch: 100 // loss: 0.046\n", "epoch: 192, batch: 200 // loss: 0.043\n", "epoch: 192, batch: 300 // loss: 0.049\n", "epoch: 192, batch: 400 // loss: 0.046\n", "epoch: 192, batch: 500 // loss: 0.040\n", "epoch: 192, batch: 600 // loss: 0.040\n", "epoch: 192, batch: 700 // loss: 0.044\n", "epoch: 192, batch: 800 // loss: 0.042\n", "epoch: 192, batch: 900 // loss: 0.049\n", "epoch: 192, batch: 1000 // loss: 0.046\n", "epoch: 192, batch: 1100 // loss: 0.042\n", "epoch: 192, batch: 1200 // loss: 0.044\n", "epoch: 192, batch: 1300 // loss: 0.046\n", "epoch: 192, batch: 1400 // loss: 0.043\n", "epoch: 192, batch: 1500 // loss: 0.048\n", "epoch: 192, batch: 1600 // loss: 0.052\n", "epoch: 192, batch: 1700 // loss: 0.045\n", "epoch: 192, batch: 1800 // loss: 0.053\n", "epoch: 192, batch: 1900 // loss: 0.045\n", "epoch: 192, batch: 2000 // loss: 0.047\n", "epoch: 192, batch: 2100 // loss: 0.046\n", "epoch: 192, batch: 2200 // loss: 0.050\n", "epoch: 192, batch: 2300 // loss: 0.049\n", "epoch: 192, batch: 2400 // loss: 0.042\n", "epoch: 192, batch: 2500 // loss: 0.042\n", "epoch: 192, batch: 2600 // loss: 0.045\n", "epoch: 192, batch: 2700 // loss: 0.042\n", "epoch: 192, batch: 2800 // loss: 0.046\n", "epoch: 192, batch: 2900 // loss: 0.042\n", "epoch: 192, batch: 3000 // loss: 0.045\n", "epoch: 192, batch: 3100 // loss: 0.043\n", "epoch: 192, batch: 3200 // loss: 0.039\n", "epoch: 192, batch: 3300 // loss: 0.038\n", "epoch: 192, batch: 3400 // loss: 0.044\n", "epoch: 192, batch: 3500 // loss: 0.035\n", "epoch: 192, batch: 3600 // loss: 0.043\n", "epoch: 192, batch: 3700 // loss: 0.043\n", "\n", "epoch: 193, batch: 0 // loss: 0.053\n", "epoch: 193, batch: 100 // loss: 0.046\n", "epoch: 193, batch: 200 // loss: 0.043\n", "epoch: 193, batch: 300 // loss: 0.049\n", "epoch: 193, batch: 400 // loss: 0.046\n", "epoch: 193, batch: 500 // loss: 0.040\n", "epoch: 193, batch: 600 // loss: 0.040\n", "epoch: 193, batch: 700 // loss: 0.044\n", "epoch: 193, batch: 800 // loss: 0.042\n", "epoch: 193, batch: 900 // loss: 0.049\n", "epoch: 193, batch: 1000 // loss: 0.046\n", "epoch: 193, batch: 1100 // loss: 0.042\n", "epoch: 193, batch: 1200 // loss: 0.044\n", "epoch: 193, batch: 1300 // loss: 0.046\n", "epoch: 193, batch: 1400 // loss: 0.043\n", "epoch: 193, batch: 1500 // loss: 0.048\n", "epoch: 193, batch: 1600 // loss: 0.052\n", "epoch: 193, batch: 1700 // loss: 0.045\n", "epoch: 193, batch: 1800 // loss: 0.053\n", "epoch: 193, batch: 1900 // loss: 0.045\n", "epoch: 193, batch: 2000 // loss: 0.047\n", "epoch: 193, batch: 2100 // loss: 0.046\n", "epoch: 193, batch: 2200 // loss: 0.050\n", "epoch: 193, batch: 2300 // loss: 0.049\n", "epoch: 193, batch: 2400 // loss: 0.042\n", "epoch: 193, batch: 2500 // loss: 0.042\n", "epoch: 193, batch: 2600 // loss: 0.045\n", "epoch: 193, batch: 2700 // loss: 0.042\n", "epoch: 193, batch: 2800 // loss: 0.046\n", "epoch: 193, batch: 2900 // loss: 0.042\n", "epoch: 193, batch: 3000 // loss: 0.045\n", "epoch: 193, batch: 3100 // loss: 0.043\n", "epoch: 193, batch: 3200 // loss: 0.039\n", "epoch: 193, batch: 3300 // loss: 0.038\n", "epoch: 193, batch: 3400 // loss: 0.044\n", "epoch: 193, batch: 3500 // loss: 0.035\n", "epoch: 193, batch: 3600 // loss: 0.043\n", "epoch: 193, batch: 3700 // loss: 0.043\n", "\n", "epoch: 194, batch: 0 // loss: 0.053\n", "epoch: 194, batch: 100 // loss: 0.046\n", "epoch: 194, batch: 200 // loss: 0.043\n", "epoch: 194, batch: 300 // loss: 0.049\n", "epoch: 194, batch: 400 // loss: 0.046\n", "epoch: 194, batch: 500 // loss: 0.040\n", "epoch: 194, batch: 600 // loss: 0.040\n", "epoch: 194, batch: 700 // loss: 0.044\n", "epoch: 194, batch: 800 // loss: 0.042\n", "epoch: 194, batch: 900 // loss: 0.049\n", "epoch: 194, batch: 1000 // loss: 0.046\n", "epoch: 194, batch: 1100 // loss: 0.042\n", "epoch: 194, batch: 1200 // loss: 0.044\n", "epoch: 194, batch: 1300 // loss: 0.046\n", "epoch: 194, batch: 1400 // loss: 0.043\n", "epoch: 194, batch: 1500 // loss: 0.048\n", "epoch: 194, batch: 1600 // loss: 0.052\n", "epoch: 194, batch: 1700 // loss: 0.045\n", "epoch: 194, batch: 1800 // loss: 0.053\n", "epoch: 194, batch: 1900 // loss: 0.045\n", "epoch: 194, batch: 2000 // loss: 0.047\n", "epoch: 194, batch: 2100 // loss: 0.046\n", "epoch: 194, batch: 2200 // loss: 0.050\n", "epoch: 194, batch: 2300 // loss: 0.049\n", "epoch: 194, batch: 2400 // loss: 0.042\n", "epoch: 194, batch: 2500 // loss: 0.042\n", "epoch: 194, batch: 2600 // loss: 0.045\n", "epoch: 194, batch: 2700 // loss: 0.042\n", "epoch: 194, batch: 2800 // loss: 0.046\n", "epoch: 194, batch: 2900 // loss: 0.042\n", "epoch: 194, batch: 3000 // loss: 0.045\n", "epoch: 194, batch: 3100 // loss: 0.043\n", "epoch: 194, batch: 3200 // loss: 0.039\n", "epoch: 194, batch: 3300 // loss: 0.038\n", "epoch: 194, batch: 3400 // loss: 0.044\n", "epoch: 194, batch: 3500 // loss: 0.035\n", "epoch: 194, batch: 3600 // loss: 0.043\n", "epoch: 194, batch: 3700 // loss: 0.043\n", "\n", "epoch: 195, batch: 0 // loss: 0.053\n", "epoch: 195, batch: 100 // loss: 0.046\n", "epoch: 195, batch: 200 // loss: 0.043\n", "epoch: 195, batch: 300 // loss: 0.049\n", "epoch: 195, batch: 400 // loss: 0.046\n", "epoch: 195, batch: 500 // loss: 0.040\n", "epoch: 195, batch: 600 // loss: 0.040\n", "epoch: 195, batch: 700 // loss: 0.044\n", "epoch: 195, batch: 800 // loss: 0.042\n", "epoch: 195, batch: 900 // loss: 0.049\n", "epoch: 195, batch: 1000 // loss: 0.046\n", "epoch: 195, batch: 1100 // loss: 0.042\n", "epoch: 195, batch: 1200 // loss: 0.044\n", "epoch: 195, batch: 1300 // loss: 0.046\n", "epoch: 195, batch: 1400 // loss: 0.043\n", "epoch: 195, batch: 1500 // loss: 0.048\n", "epoch: 195, batch: 1600 // loss: 0.052\n", "epoch: 195, batch: 1700 // loss: 0.045\n", "epoch: 195, batch: 1800 // loss: 0.053\n", "epoch: 195, batch: 1900 // loss: 0.045\n", "epoch: 195, batch: 2000 // loss: 0.047\n", "epoch: 195, batch: 2100 // loss: 0.046\n", "epoch: 195, batch: 2200 // loss: 0.050\n", "epoch: 195, batch: 2300 // loss: 0.049\n", "epoch: 195, batch: 2400 // loss: 0.042\n", "epoch: 195, batch: 2500 // loss: 0.042\n", "epoch: 195, batch: 2600 // loss: 0.045\n", "epoch: 195, batch: 2700 // loss: 0.042\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 195, batch: 2800 // loss: 0.046\n", "epoch: 195, batch: 2900 // loss: 0.042\n", "epoch: 195, batch: 3000 // loss: 0.045\n", "epoch: 195, batch: 3100 // loss: 0.043\n", "epoch: 195, batch: 3200 // loss: 0.039\n", "epoch: 195, batch: 3300 // loss: 0.038\n", "epoch: 195, batch: 3400 // loss: 0.044\n", "epoch: 195, batch: 3500 // loss: 0.035\n", "epoch: 195, batch: 3600 // loss: 0.043\n", "epoch: 195, batch: 3700 // loss: 0.043\n", "\n", "epoch: 196, batch: 0 // loss: 0.053\n", "epoch: 196, batch: 100 // loss: 0.046\n", "epoch: 196, batch: 200 // loss: 0.043\n", "epoch: 196, batch: 300 // loss: 0.049\n", "epoch: 196, batch: 400 // loss: 0.046\n", "epoch: 196, batch: 500 // loss: 0.040\n", "epoch: 196, batch: 600 // loss: 0.040\n", "epoch: 196, batch: 700 // loss: 0.044\n", "epoch: 196, batch: 800 // loss: 0.042\n", "epoch: 196, batch: 900 // loss: 0.049\n", "epoch: 196, batch: 1000 // loss: 0.046\n", "epoch: 196, batch: 1100 // loss: 0.042\n", "epoch: 196, batch: 1200 // loss: 0.044\n", "epoch: 196, batch: 1300 // loss: 0.046\n", "epoch: 196, batch: 1400 // loss: 0.043\n", "epoch: 196, batch: 1500 // loss: 0.048\n", "epoch: 196, batch: 1600 // loss: 0.052\n", "epoch: 196, batch: 1700 // loss: 0.045\n", "epoch: 196, batch: 1800 // loss: 0.053\n", "epoch: 196, batch: 1900 // loss: 0.045\n", "epoch: 196, batch: 2000 // loss: 0.047\n", "epoch: 196, batch: 2100 // loss: 0.046\n", "epoch: 196, batch: 2200 // loss: 0.050\n", "epoch: 196, batch: 2300 // loss: 0.049\n", "epoch: 196, batch: 2400 // loss: 0.042\n", "epoch: 196, batch: 2500 // loss: 0.042\n", "epoch: 196, batch: 2600 // loss: 0.045\n", "epoch: 196, batch: 2700 // loss: 0.042\n", "epoch: 196, batch: 2800 // loss: 0.046\n", "epoch: 196, batch: 2900 // loss: 0.042\n", "epoch: 196, batch: 3000 // loss: 0.045\n", "epoch: 196, batch: 3100 // loss: 0.043\n", "epoch: 196, batch: 3200 // loss: 0.039\n", "epoch: 196, batch: 3300 // loss: 0.038\n", "epoch: 196, batch: 3400 // loss: 0.044\n", "epoch: 196, batch: 3500 // loss: 0.035\n", "epoch: 196, batch: 3600 // loss: 0.043\n", "epoch: 196, batch: 3700 // loss: 0.043\n", "\n", "epoch: 197, batch: 0 // loss: 0.053\n", "epoch: 197, batch: 100 // loss: 0.046\n", "epoch: 197, batch: 200 // loss: 0.043\n", "epoch: 197, batch: 300 // loss: 0.049\n", "epoch: 197, batch: 400 // loss: 0.046\n", "epoch: 197, batch: 500 // loss: 0.040\n", "epoch: 197, batch: 600 // loss: 0.040\n", "epoch: 197, batch: 700 // loss: 0.044\n", "epoch: 197, batch: 800 // loss: 0.042\n", "epoch: 197, batch: 900 // loss: 0.049\n", "epoch: 197, batch: 1000 // loss: 0.046\n", "epoch: 197, batch: 1100 // loss: 0.042\n", "epoch: 197, batch: 1200 // loss: 0.044\n", "epoch: 197, batch: 1300 // loss: 0.046\n", "epoch: 197, batch: 1400 // loss: 0.043\n", "epoch: 197, batch: 1500 // loss: 0.048\n", "epoch: 197, batch: 1600 // loss: 0.052\n", "epoch: 197, batch: 1700 // loss: 0.045\n", "epoch: 197, batch: 1800 // loss: 0.053\n", "epoch: 197, batch: 1900 // loss: 0.045\n", "epoch: 197, batch: 2000 // loss: 0.047\n", "epoch: 197, batch: 2100 // loss: 0.046\n", "epoch: 197, batch: 2200 // loss: 0.050\n", "epoch: 197, batch: 2300 // loss: 0.049\n", "epoch: 197, batch: 2400 // loss: 0.042\n", "epoch: 197, batch: 2500 // loss: 0.042\n", "epoch: 197, batch: 2600 // loss: 0.045\n", "epoch: 197, batch: 2700 // loss: 0.042\n", "epoch: 197, batch: 2800 // loss: 0.046\n", "epoch: 197, batch: 2900 // loss: 0.042\n", "epoch: 197, batch: 3000 // loss: 0.045\n", "epoch: 197, batch: 3100 // loss: 0.043\n", "epoch: 197, batch: 3200 // loss: 0.039\n", "epoch: 197, batch: 3300 // loss: 0.038\n", "epoch: 197, batch: 3400 // loss: 0.044\n", "epoch: 197, batch: 3500 // loss: 0.035\n", "epoch: 197, batch: 3600 // loss: 0.043\n", "epoch: 197, batch: 3700 // loss: 0.043\n", "\n", "epoch: 198, batch: 0 // loss: 0.053\n", "epoch: 198, batch: 100 // loss: 0.046\n", "epoch: 198, batch: 200 // loss: 0.043\n", "epoch: 198, batch: 300 // loss: 0.049\n", "epoch: 198, batch: 400 // loss: 0.046\n", "epoch: 198, batch: 500 // loss: 0.040\n", "epoch: 198, batch: 600 // loss: 0.040\n", "epoch: 198, batch: 700 // loss: 0.044\n", "epoch: 198, batch: 800 // loss: 0.042\n", "epoch: 198, batch: 900 // loss: 0.049\n", "epoch: 198, batch: 1000 // loss: 0.046\n", "epoch: 198, batch: 1100 // loss: 0.042\n", "epoch: 198, batch: 1200 // loss: 0.044\n", "epoch: 198, batch: 1300 // loss: 0.046\n", "epoch: 198, batch: 1400 // loss: 0.043\n", "epoch: 198, batch: 1500 // loss: 0.048\n", "epoch: 198, batch: 1600 // loss: 0.052\n", "epoch: 198, batch: 1700 // loss: 0.045\n", "epoch: 198, batch: 1800 // loss: 0.053\n", "epoch: 198, batch: 1900 // loss: 0.045\n", "epoch: 198, batch: 2000 // loss: 0.047\n", "epoch: 198, batch: 2100 // loss: 0.046\n", "epoch: 198, batch: 2200 // loss: 0.050\n", "epoch: 198, batch: 2300 // loss: 0.049\n", "epoch: 198, batch: 2400 // loss: 0.042\n", "epoch: 198, batch: 2500 // loss: 0.042\n", "epoch: 198, batch: 2600 // loss: 0.045\n", "epoch: 198, batch: 2700 // loss: 0.042\n", "epoch: 198, batch: 2800 // loss: 0.046\n", "epoch: 198, batch: 2900 // loss: 0.042\n", "epoch: 198, batch: 3000 // loss: 0.045\n", "epoch: 198, batch: 3100 // loss: 0.043\n", "epoch: 198, batch: 3200 // loss: 0.039\n", "epoch: 198, batch: 3300 // loss: 0.038\n", "epoch: 198, batch: 3400 // loss: 0.044\n", "epoch: 198, batch: 3500 // loss: 0.035\n", "epoch: 198, batch: 3600 // loss: 0.043\n", "epoch: 198, batch: 3700 // loss: 0.043\n", "\n", "epoch: 199, batch: 0 // loss: 0.053\n", "epoch: 199, batch: 100 // loss: 0.046\n", "epoch: 199, batch: 200 // loss: 0.043\n", "epoch: 199, batch: 300 // loss: 0.049\n", "epoch: 199, batch: 400 // loss: 0.046\n", "epoch: 199, batch: 500 // loss: 0.040\n", "epoch: 199, batch: 600 // loss: 0.040\n", "epoch: 199, batch: 700 // loss: 0.044\n", "epoch: 199, batch: 800 // loss: 0.042\n", "epoch: 199, batch: 900 // loss: 0.049\n", "epoch: 199, batch: 1000 // loss: 0.046\n", "epoch: 199, batch: 1100 // loss: 0.042\n", "epoch: 199, batch: 1200 // loss: 0.044\n", "epoch: 199, batch: 1300 // loss: 0.046\n", "epoch: 199, batch: 1400 // loss: 0.043\n", "epoch: 199, batch: 1500 // loss: 0.048\n", "epoch: 199, batch: 1600 // loss: 0.052\n", "epoch: 199, batch: 1700 // loss: 0.045\n", "epoch: 199, batch: 1800 // loss: 0.053\n", "epoch: 199, batch: 1900 // loss: 0.045\n", "epoch: 199, batch: 2000 // loss: 0.047\n", "epoch: 199, batch: 2100 // loss: 0.046\n", "epoch: 199, batch: 2200 // loss: 0.050\n", "epoch: 199, batch: 2300 // loss: 0.049\n", "epoch: 199, batch: 2400 // loss: 0.042\n", "epoch: 199, batch: 2500 // loss: 0.042\n", "epoch: 199, batch: 2600 // loss: 0.045\n", "epoch: 199, batch: 2700 // loss: 0.042\n", "epoch: 199, batch: 2800 // loss: 0.046\n", "epoch: 199, batch: 2900 // loss: 0.042\n", "epoch: 199, batch: 3000 // loss: 0.045\n", "epoch: 199, batch: 3100 // loss: 0.043\n", "epoch: 199, batch: 3200 // loss: 0.039\n", "epoch: 199, batch: 3300 // loss: 0.038\n", "epoch: 199, batch: 3400 // loss: 0.044\n", "epoch: 199, batch: 3500 // loss: 0.035\n", "epoch: 199, batch: 3600 // loss: 0.043\n", "epoch: 199, batch: 3700 // loss: 0.043\n" ] } ], "source": [ "loss_function = nn.MSELoss()\n", "auto = AE()\n", "optimizer = optim.SGD(auto.parameters(), lr=0.01, momentum=0.9)\n", "\n", "train_AE(X, X, auto, optimizer, loss_function, EPOCHS=50)" ] }, { "cell_type": "code", "execution_count": 196, "metadata": {}, "outputs": [], "source": [ "X_tilde = auto(X[:5000].float()).detach().numpy()" ] }, { "cell_type": "code", "execution_count": 197, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 197, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAPsAAAD4CAYAAAAq5pAIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAAReElEQVR4nO3dW2xd5ZkG4PeNE+foHO0YJxhIQ6QMijJ0FEUjcVBGaArkglChjhqkKiOhphetaFEREzEXzQ0SGk1bejFUcgfUMHSoKrUVQeGikRWBKhBgokwIZCghcRonW87JITE5EeebCy9GDvH6/p299sn+3keybO/Pa6/fO3m99t7f+tdPM4OITH5TGj0AEakPhV0kCIVdJAiFXSQIhV0kiKn13BnJkG/9t7a2uvW2tja3Pn/+fLd+5cqV3NqpU6fcbc+fP+/WZ8yY4dYXLFjg1ufOnZtbu3r1qrttauwnT55061GZGce7vVDYST4A4BcAWgD8p5k9W+T+JqslS5a49XXr1rn1DRs2uHUvFC+//LK77e7du936ypUr3fojjzzi1u+7777cWuoPTWrsPT09bl2uVfHTeJItAP4DwIMA7gCwkeQd1RqYiFRXkdfsawEcMLODZnYZwG8B+IcgEWmYImFfCuDImO8HstuuQXIzyT6SfQX2JSIFFXnNPt6bANe9AWdmPQB6gLhv0Ik0gyJH9gEA3WO+vxnAsWLDEZFaKRL29wCsILmMZCuAbwPYXp1hiUi1scisN5LrATyH0dbbi2b2TOLnJ+zT+AcffDC39sQTT7jbXrhwwa2n+vAXL150616fftWqVe62nZ2dbr2/v9+tez1+ACiVSrm1zz77zN12+vTpbn3p0uveIrpGb29vbu3xxx93t53IatJnN7PXAbxe5D5EpD50uqxIEAq7SBAKu0gQCrtIEAq7SBAKu0gQhfrsN7yzJu6zL1++3K1v3bo1tzY4OOhuO2vWLLc+ZYr/Nzc179vrdXd3d+fWypHad6ru9dJTPfovvvjCrZ8+fdqte334M2fOuNs++eSTbr2Z5fXZdWQXCUJhFwlCYRcJQmEXCUJhFwlCYRcJQq23zPPPP+/WvWmmqfbTnDlz3Hrqcs2pFpV3ldbUtqlppqmxpX731DRVz8jIiFtP/W7ev1lq6u9LL73k1nfs2OHWG0mtN5HgFHaRIBR2kSAUdpEgFHaRIBR2kSAUdpEg1GfPrF271q17l4s+ceKEu+3Q0JBbTy3ZnJrq6bl8+bJbTy0HnXL27Fm3nurDF5H63ebNm1fxfWuKq4hMWAq7SBAKu0gQCrtIEAq7SBAKu0gQCrtIEIVWcZ1M3n33Xbf+9ttv59Yeeughd9t33nnHrU+d6v8zpC5FferUqdxaqhd98uRJt55aLjo1Nu93S/XoOzo63HqKN7YtW7YUuu+JqFDYSfYDOAdgBMAVM1tTjUGJSPVV48j+D2bmHx5EpOH0ml0kiKJhNwB/Ivk+yc3j/QDJzST7SPYV3JeIFFD0afxdZnaM5GIAO0n+r5m9OfYHzKwHQA/Q3BNhRCa7Qkd2MzuWfT4O4I8A/KljItIwFYed5GySbV9+DeAbAPZVa2AiUl0Vz2cn+TWMHs2B0ZcD/21mzyS2mZRP4z/99FO3/sYbb7j11Hz41Jzw4eHh3Nq5c+fcbVNaWlrcemquvddnnzZtmrttqoefmq++a9eu3Nprr73mbjuR5c1nr/g1u5kdBPC3FY9IROpKrTeRIBR2kSAUdpEgFHaRIBR2kSA0xTWTmmbqLQ989913u9s+84zbkUzylmQG/LHNnDnT3fbChQtuPfW4pOqXLl3KrU2ZUuxYk9p+MrfXKqEju0gQCrtIEAq7SBAKu0gQCrtIEAq7SBAKu0gQ6rNnvF51SqlUcuupKbDLli1z66nLOXvTWFPTY1P3neple9NrAf9y0KnHPLXvw4cPu3W5lo7sIkEo7CJBKOwiQSjsIkEo7CJBKOwiQSjsIkGoz14HqX5xW1ubW0/1yqdPn55bSy2L3Nra6tZTffjUktCeIuc2AMDx48cLbR+NjuwiQSjsIkEo7CJBKOwiQSjsIkEo7CJBKOwiQajPXiavV57qgw8MDLj11atXV7xvwL82e2pJ7tSyySMjI259xowZbt27Ln2qh9/e3u7Wjx496tY9RdYJmKiSR3aSL5I8TnLfmNsWktxJ8pPs84LaDlNEiirnafyvATzwldu2AOg1sxUAerPvRaSJJcNuZm8COP2VmzcA2JZ9vQ3Aw1Uel4hUWaWv2TvNrAQAZlYiuTjvB0luBrC5wv2ISJXU/A06M+sB0AMAJP13i0SkZiptvQ2S7AKA7LOmH4k0uUrDvh3ApuzrTQBerc5wRKRWkk/jSb4CYB2AdpIDAH4C4FkAvyP5GIC/AvhWLQc50fX397v1VB89Ned8wYL8zmdq36l+8qJFi9z60NBQxffvnR8ApB+XydgLr6Vk2M1sY07pviqPRURqSKfLigShsIsEobCLBKGwiwShsIsEoSmudeBN8wTSU2RTvO1bWlrcbVNTVFNjS7XevGmqqUtop6Sm58q1dGQXCUJhFwlCYRcJQmEXCUJhFwlCYRcJQmEXCUJ99jIV6YWnpmKeOHHCraeWRU71uotsm9r3zJkz3bq3rHJHR4e77fDwsFuXG6Mju0gQCrtIEAq7SBAKu0gQCrtIEAq7SBAKu0gQ6rOXqciSzal5296loAHg/Pnzbn3hwoVu3XPy5Em3PmvWLLc+b948t57q03tIuvVbb7214vuOeBlqHdlFglDYRYJQ2EWCUNhFglDYRYJQ2EWCUNhFglCfvUxF5rOn5qvv27fPrR85csSte73wixcvutt2dna69VSfPLUktLf/VI++VCq59SVLlrh1uVbyyE7yRZLHSe4bc9tWkkdJ7sk+1td2mCJSVDlP438N4IFxbv+5md2Zfbxe3WGJSLUlw25mbwI4XYexiEgNFXmD7gck92ZP83NP7ia5mWQfyb4C+xKRgioN+y8BLAdwJ4ASgJ/m/aCZ9ZjZGjNbU+G+RKQKKgq7mQ2a2YiZXQXwKwBrqzssEam2isJOsmvMt98E4PeORKThkn12kq8AWAegneQAgJ8AWEfyTgAGoB/A92o4xgnvnnvucesHDx5064cPH3brXi/77Nmz7rZz585166leeGrtea9P39XVlVsrx0033eTWFy9enFvzrmcP+NcvAIqdd9EoybCb2cZxbn6hBmMRkRrS6bIiQSjsIkEo7CJBKOwiQSjsIkHQzOq3M7J+O7tBRVot3d3d7rZPPfWUW0+13lLTVNvb23NrBw4ccLedPXu2W1+2bJlbP3PmjFtPtfaKSE2/PXfuXG7tueeeq/ZwmoaZjXsNbh3ZRYJQ2EWCUNhFglDYRYJQ2EWCUNhFglDYRYLQpaQzRaYs3n///W79o48+cuszZsxw66lpqrfddltu7ejRo+62K1eudOupx2VgYMCtr169Orc2ODjobrto0SK3PjQ05NaXLl2aW7v99tvdbVPnJ0xEOrKLBKGwiwShsIsEobCLBKGwiwShsIsEobCLBKE+exV4vWQA2Lt3r1tvaWlx662trW59+vTpbr3IvlNSfXivnpqnn7pOQOr8A6/unZsAqM8uIhOYwi4ShMIuEoTCLhKEwi4ShMIuEoTCLhKE+uxl8vqypVLJ3TY1X314eNitT53q/zNduXIltzZz5kx32xTvvoF0n73IOQDnz593652dnW7dm8vf0dFR0ZgmsuSRnWQ3yV0k95P8kOQPs9sXktxJ8pPs84LaD1dEKlXO0/grAH5sZn8D4O8BfJ/kHQC2AOg1sxUAerPvRaRJJcNuZiUz2519fQ7AfgBLAWwAsC37sW0AHq7VIEWkuBt6zU7yNgBfB/AOgE4zKwGjfxBILs7ZZjOAzcWGKSJFlR12knMA/B7Aj8zsLDnu2nHXMbMeAD3ZfTTtwo4ik11ZrTeS0zAa9N+Y2R+ymwdJdmX1LgDHazNEEamG5JGdo4fwFwDsN7OfjSltB7AJwLPZ51drMsImccstt+TWUu2nVOssNYU11bobGRmpeN8pCxb4TZZUa87bf2pshw4dcusrVqxw696lqufNm+duu3DhQrd++vRpt96MyvmfcBeA7wD4gOSe7LanMRry35F8DMBfAXyrNkMUkWpIht3M/gwg7wX6fdUdjojUik6XFQlCYRcJQmEXCUJhFwlCYRcJQlNcy+RdcnnKFP9vZmqq5qxZs9z6tGnT3Prly5dza6lzAMz8kxrnzJnj1lN99kuXLuXWvCWVAaCvr8+t33vvvW7dm3qc6vGnzi+YiH12HdlFglDYRYJQ2EWCUNhFglDYRYJQ2EWCUNhFglCfvUzt7e25tdR89BMnTrj1VatWufXUfHZvaeLU2FJ98ra2Nreeun9vWebUUtc7duxw62fOnHHr3thSffSi1wFoRjqyiwShsIsEobCLBKGwiwShsIsEobCLBKGwiwQx+ZqJNeL12VPz2U+dOuXWU9cwT/V8vXnbqT740NCQW//888/deup3LyK1lHVq7N5c/tTv1dXV5dY//vhjt96MdGQXCUJhFwlCYRcJQmEXCUJhFwlCYRcJQmEXCaKc9dm7AbwE4CYAVwH0mNkvSG4F8F0AX07WftrMXq/VQBvNu3566rrwqbnTKan57N5141M9+o6ODreemos/e/bsiu/fO3cBAJYvX+7WU9fE984BSG2bmsc/EZVzUs0VAD82s90k2wC8T3JnVvu5mf177YYnItVSzvrsJQCl7OtzJPcD8JfyEJGmc0Ov2UneBuDrAN7JbvoByb0kXyQ57nNVkptJ9pH01/IRkZoqO+wk5wD4PYAfmdlZAL8EsBzAnRg98v90vO3MrMfM1pjZmiqMV0QqVFbYSU7DaNB/Y2Z/AAAzGzSzETO7CuBXANbWbpgiUlQy7CQJ4AUA+83sZ2NuHzst6JsA9lV/eCJSLeW8G38XgO8A+IDknuy2pwFsJHknAAPQD+B7NRlhk1ixYkVu7dChQ+62qdZZSmoaqbfks3cpZwB466233Pqjjz7q1lOtvd7e3txa6vdK1efPn+/WvWmsqX+zXbt2ufWJqJx34/8MgOOUJm1PXWQy0hl0IkEo7CJBKOwiQSjsIkEo7CJBKOwiQdDM6rczsn47qzKvn5xa9jjVL05Nt0xN9Tx8+HBu7eabb3a37e/vd+sy8ZjZeK1yHdlFolDYRYJQ2EWCUNhFglDYRYJQ2EWCUNhFgqh3n/0EgLFN4XYAJ+s2gBvTrGNr1nEBGlulqjm2W81s3Ot31zXs1+2c7GvWa9M169iadVyAxlapeo1NT+NFglDYRYJodNh7Grx/T7OOrVnHBWhslarL2Br6ml1E6qfRR3YRqROFXSSIhoSd5AMkPyZ5gOSWRowhD8l+kh+Q3NPo9emyNfSOk9w35raFJHeS/CT7XGw96OqObSvJo9ljt4fk+gaNrZvkLpL7SX5I8ofZ7Q197Jxx1eVxq/trdpItAP4C4B8BDAB4D8BGM/uorgPJQbIfwBoza/gJGCTvBTAM4CUzW5Xd9m8ATpvZs9kfygVm9i9NMratAIYbvYx3tlpR19hlxgE8DOCf0cDHzhnXP6EOj1sjjuxrARwws4NmdhnAbwFsaMA4mp6ZvQng9Fdu3gBgW/b1Noz+Z6m7nLE1BTMrmdnu7OtzAL5cZryhj50zrrpoRNiXAjgy5vsBNNd67wbgTyTfJ7m50YMZR6eZlYDR/zwAFjd4PF+VXMa7nr6yzHjTPHaVLH9eVCPCPt71sZqp/3eXmf0dgAcBfD97uirlKWsZ73oZZ5nxplDp8udFNSLsAwC6x3x/M4BjDRjHuMzsWPb5OIA/ovmWoh78cgXd7PPxBo/n/zXTMt7jLTOOJnjsGrn8eSPC/h6AFSSXkWwF8G0A2xswjuuQnJ29cQKSswF8A823FPV2AJuyrzcBeLWBY7lGsyzjnbfMOBr82DV8+XMzq/sHgPUYfUf+UwD/2ogx5IzrawD+J/v4sNFjA/AKRp/WfYHRZ0SPAVgEoBfAJ9nnhU00tv8C8AGAvRgNVleDxnY3Rl8a7gWwJ/tY3+jHzhlXXR43nS4rEoTOoBMJQmEXCUJhFwlCYRcJQmEXCUJhFwlCYRcJ4v8ARgjbvwCW3h4AAAAASUVORK5CYII=\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "imshow(np.asarray(X[3]).reshape(28,28), cmap='gray')" ] }, { "cell_type": "code", "execution_count": 198, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 198, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAPsAAAD4CAYAAAAq5pAIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAASAElEQVR4nO3dX4hd13XH8d+y/o40+mtZslCEnQY/2BTqmEHUuBSX0OD4wXYeUqKHoILp5CGGBPJQ4z7Ej6Y0CXkoAaU2UUrqEEiM9WDaCBMweQkeGVWWI7X+w1RRLEsyliVZ0mj0Z/VhjsPEnrvWzdn33nOd/f3AMDN33X3OnnPvmnPvXWfvbe4uAH/6buq6AwBGg2QHKkGyA5Ug2YFKkOxAJZaPdGfLl/uKFStGucuxYGZhPDsma9eubd0+q7bcuHEjjGftb7opPl9Ef3u27fn5+TB+6dKlMH79+vXW+/6kunr1qq5du7bkQS9KdjN7QNL3JC2T9G/u/lR0/xUrVuj2228v2WVnoid19oRfvjw+zNu2bQvj9957b+v2WcJcvnw5jF+9ejWMr1mzJoxH/4iybR8/fjyMHzx4MIyfP3++Zyz6RyCV/zPI/okOy+zsbM9Y65fxZrZM0r9K+oKkuyTtNrO72m4PwHCVvGffJekNd3/L3ecl/UTSw4PpFoBBK0n2HZJ+u+j3E81tf8DMps1sxsxmrl27VrA7ACVKkn2pDwE+9kbH3fe6+5S7T2XvXQEMT0myn5C0c9Hvn5L0dll3AAxLSbK/LOkOM/u0ma2U9GVJ+wfTLQCD1vp1tbtfM7PHJP2XFkpvz7j7awPr2YiVlM+y8tMtt9wSxu+5554w/tBDD4XxHTs+9lHJ723cuDFsm8lKVNlbs4sXL/aMvfPOO2HbqIwk5WXFY8eO9YxduHAhbDs3NxfGuyqtlSh6E+3uL0h6YUB9ATBEXC4LVIJkBypBsgOVINmBSpDsQCVIdqAS1Vy/mtXRszHlExMTrWKSNDk5GcY3bNgQxrO+nz17tmcsG/OdXSOQ7TsbIhvVs7O2y5YtC+PZNQTRPADZ8Nrs786Oa8k8Adn8B21xZgcqQbIDlSDZgUqQ7EAlSHagEiQ7UAlKb42SKa6zEtHKlSvDeFaay0TDULOpwLISUjbL6pUrV8J41LesPJU9ZiUz22ZKZwzOjnvJ7LVtS3Oc2YFKkOxAJUh2oBIkO1AJkh2oBMkOVIJkBypRTZ09q4VnoppwNt1y6ZLN2fZL9p3Ve7P2WT05imfDTLNtZ49pyfUHpfvOlExF3XZlJc7sQCVIdqASJDtQCZIdqATJDlSCZAcqQbIDlfhE1dlLpt/N4lndM6q7RlMW97PvYY6NLp2WOBvXnV0DENXSs78rq8Nnose0tMZfelyjvg1rKumiZDezWUkXJF2XdM3dpwbRKQCDN4gz+9+4+7sD2A6AIeI9O1CJ0mR3Sb8ws4NmNr3UHcxs2sxmzGwmex8EYHhKX8bf5+5vm9lWSQfM7Ji7v7T4Du6+V9JeSZqYmGg/yx6AIkVndnd/u/l+WtJzknYNolMABq91spvZWjNb9+HPkj4v6cigOgZgsEpexm+T9FxTE1wu6T/c/T9LOpONrY5qutn44mzb2ecJWb25RFbjn5+fD+OrVq3qGcv+7tJ4yXHJ/u6sFp7V+KN41jabD7/tmPIPDWs8e/R4te6xu78l6S/atgcwWpTegEqQ7EAlSHagEiQ7UAmSHajEWA1xLVnGNpOVWrLSW1TeKi3DZGWerAQVLQldUs7sZ9/ZNNglUy5nj0nJFNtZv0qGPJcaVpmXMztQCZIdqATJDlSCZAcqQbIDlSDZgUqQ7EAlxqrOntU2S+rwpdMWR7X00ql/szr7MKeSzrZ99uzZMH7bbbeF8Wj/2TEvvUYgugagtM6eHdds+9G1ESXDXyOc2YFKkOxAJUh2oBIkO1AJkh2oBMkOVIJkByoxVnX2TFR3Hfa47Wg8e2ldtHRp4mj8c2k9+dKlS2F8w4YNYbxkzHk2Vj57zKO/fZhTg0txHV2Kr9vIrn1ou9wzZ3agEiQ7UAmSHagEyQ5UgmQHKkGyA5Ug2YFKjFWdPaubRvXFbFnj0vHsUd20ZLx5P/vO6s1R39auXRu2vXjxYhjP5sSfnJwM49HjkvVtzZo1YTwbU14yn3/pWgBZnT2q82fPh7m5uVZ9Ss/sZvaMmZ02syOLbttsZgfM7PXm+6ZWewcwMv28jP+hpAc+ctvjkl509zskvdj8DmCMpcnu7i9Jeu8jNz8saV/z8z5Jjwy4XwAGrO0bk23uflKS3P2kmW3tdUczm5Y0LZW/DwLQ3tA/jXf3ve4+5e5TJDvQnbbJfsrMtktS8/304LoEYBjaJvt+SXuan/dIen4w3QEwLOnrajN7VtL9kraY2QlJ35L0lKSfmtmjko5L+lI/O3P3ojHpkaw2efny5aL2Ud00a1s6x3g2Zvzmm2/uGVu/fn3YtvS4ZOPho3pyVovO6vATExNhPKrTR/MTSOWfL2Xto/1nbbN1BnpuN7uDu+/uEfpcqz0C6ASXywKVINmBSpDsQCVIdqASJDtQibG6pK1kyeZsyuLSIbBtp++V8hLS5s2bw/itt94axqMSUzZlcjZcMjtu2XGPyopZiam09LZu3bqesdWrV4dts9Jc9nwpkQ1pjo4pU0kDINmBWpDsQCVIdqASJDtQCZIdqATJDlRirOrsmaiGmNW6s3hWd41qvtkQ1Cwe1YOlvO4aKV2qOrv2Idt+yVDRbOhvJrrGILv+INt3dtyy4xLFs6G/2XO5F87sQCVIdqASJDtQCZIdqATJDlSCZAcqQbIDlRhpnd3MwhphVuuOZHXTrDaZjY3euHFjz1i2tHBWax7mSjmldfbS5aaj45o9Zlm8ZInvTNa29PqDSPZ3R88XxrMDINmBWpDsQCVIdqASJDtQCZIdqATJDlRi5HX2aKxuVq+O6qrZ0sNZLTurs0f9Lq2jl45fjsZelyyp3I9s+yXzxmfHJRvnH20/G6+exUvHw0fxkrZFdXYze8bMTpvZkUW3PWlmvzOzQ83Xg9l2AHSrn3/rP5T0wBK3f9fd726+XhhstwAMWprs7v6SpPdG0BcAQ1Tyhu0xMzvcvMzf1OtOZjZtZjNmNjPM9bEAxNom+/clfUbS3ZJOSvp2rzu6+153n3L3qWEO+AAQa5Xs7n7K3a+7+w1JP5C0a7DdAjBorZLdzLYv+vWLko70ui+A8ZC+rjazZyXdL2mLmZ2Q9C1J95vZ3ZJc0qykr/azs6zOXrImdlZzLVlHPNt+9vYk23bWPquzR+2zOnhJDb+f7Ud9G/Zx+6TKxum3lR4td9+9xM1PD6EvAIaIy2WBSpDsQCVIdqASJDtQCZIdqMRY1S5KlrktaSvFZT0pnjI5Kz9l0y3Pz8+H8ZIpkUungs6OWza0OGqfHfNs2x988EEYv3DhQuu2Fy9eDONzc3NhPBOVPEuey9HjzZkdqATJDlSCZAcqQbIDlSDZgUqQ7EAlSHagEiOts7t7WFPO6q5RDfHKlSth26xmm+07GuJ66dKlsG1W083al0yTndWDz58/H8azvp87dy6MR/XqrJad9e39998P41GdPTumWTx7vmWiqaiz52Lb6y44swOVINmBSpDsQCVIdqASJDtQCZIdqATJDlTiE1Vnj+LZmPDSJZ2jumjJuGoprydn9ehoyuXsuGR1+OwagJJx39m+s21nfSvZd2mdPZtHoGQ56WgsfFSD58wOVIJkBypBsgOVINmBSpDsQCVIdqASJDtQiZHX2aP6Y1YTjuJZXTSryWZ19mg8e1YPLq3DZ9uPlsEuHec/zLnbs8ckOy4l1wBkx7R03vjsmpGoVh5d0yFJExMTPWNF88ab2U4z+6WZHTWz18zs683tm83sgJm93nzflG0LQHf6eRl/TdI33f1OSX8p6WtmdpekxyW96O53SHqx+R3AmEqT3d1Puvsrzc8XJB2VtEPSw5L2NXfbJ+mRYXUSQLk/6j27md0u6bOSfi1pm7uflBb+IZjZ1h5tpiVNS/n7YgDD0/en8WY2Kelnkr7h7vHIjUXcfa+7T7n7VHaBP4Dh6SvZzWyFFhL9x+7+8+bmU2a2vYlvl3R6OF0EMAjp62pbqBE8Lemou39nUWi/pD2Snmq+P9/PDqPSQDYsMBq+V7LkcrZtKS5hZeWtLF46lHPNmjWt91163LLtR+XSklJrP/GSxywrrWXto9KaJK1atapnLHu7my3p3HO7fdznPklfkfSqmR1qbntCC0n+UzN7VNJxSV9q1QMAI5Emu7v/SlKvf1OfG2x3AAwLl8sClSDZgUqQ7EAlSHagEiQ7UImRX79aMrQvimdts7pnJmpfuu2sxj/M4ZJZTbf0qsdo/yVTJktlfc+Oy5+i+v5ioFIkO1AJkh2oBMkOVIJkBypBsgOVINmBSoy0zm5mYe20ZBxvNNVzP/GSmm40lXPWViq/RiDbf0nbLJ7VyqO/PRrTXbptKX7Ms+dDtu3s2oes7yXXH7S9RoAzO1AJkh2oBMkOVIJkBypBsgOVINmBSpDsQCXGaj2mkrpqVhctqUVn7bNtr169uvW2pfy4RO2zGn20/G8/8axWXnLcs8c0O65R37J+ZXX4bO72rO9RvHScfy+c2YFKkOxAJUh2oBIkO1AJkh2oBMkOVIJkByrRz/rsOyX9SNKtkm5I2uvu3zOzJyX9g6QzzV2fcPcXsu2VzNcd1SaHPZ49qstmteZo/fR+2pfU2TNZ37Jadsm4cHdv3VbK+xZdI1BSo5fyOnvJccn+7rZrGPRzUc01Sd9091fMbJ2kg2Z2oIl9193/pY9tAOhYP+uzn5R0svn5gpkdlbRj2B0DMFh/1GtqM7td0mcl/bq56TEzO2xmz5jZph5tps1sxsxmspc+AIan72Q3s0lJP5P0DXc/L+n7kj4j6W4tnPm/vVQ7d9/r7lPuPlW6bhiA9vpKdjNboYVE/7G7/1yS3P2Uu1939xuSfiBp1/C6CaBUmuy28PHe05KOuvt3Ft2+fdHdvijpyOC7B2BQ+vk0/j5JX5H0qpkdam57QtJuM7tbkkualfTVfnaYLU8cKZl+t6SckbXPyixZaWxycjKMb9y4MYxv2bKlZyw73mfPng3jc3NzrfctSVu3bu0Zm5+fD9tu3rw5jK9fvz6MR2XFYZfeSqYXH9bb3X4+jf+VpKUyIa2pAxgfXEEHVIJkBypBsgOVINmBSpDsQCVIdqASYzWVdCaqs2d1zZKhtVn7M2fO9IxJ0tWrV8P4u+++G8ZPnToVxu+8886esez6gePHj4fxc+fOhfHZ2dkw/uabb/aMXb58OWx7+PDhMH7s2LEwHl1DkF0/UPp8KplKelg4swOVINmBSpDsQCVIdqASJDtQCZIdqATJDlTCsul8B7ozszOS/m/RTVskxUXm7oxr38a1XxJ9a2uQfbvN3W9ZKjDSZP/Yzs1m3H2qsw4ExrVv49ovib61Naq+8TIeqATJDlSi62Tf2/H+I+Pat3Htl0Tf2hpJ3zp9zw5gdLo+swMYEZIdqEQnyW5mD5jZ/5jZG2b2eBd96MXMZs3sVTM7ZGYzHfflGTM7bWZHFt222cwOmNnrzfcl19jrqG9PmtnvmmN3yMwe7KhvO83sl2Z21MxeM7OvN7d3euyCfo3kuI38PbuZLZP0v5L+VtIJSS9L2u3uvxlpR3ows1lJU+7e+QUYZvbXkj6Q9CN3//Pmtn+W9J67P9X8o9zk7v84Jn17UtIHXS/j3axWtH3xMuOSHpH09+rw2AX9+juN4Lh1cWbfJekNd3/L3ecl/UTSwx30Y+y5+0uS3vvIzQ9L2tf8vE8LT5aR69G3seDuJ939lebnC5I+XGa802MX9Gskukj2HZJ+u+j3Exqv9d5d0i/M7KCZTXfdmSVsc/eT0sKTR1Lv9ZW6kS7jPUofWWZ8bI5dm+XPS3WR7EtNijZO9b/73P0eSV+Q9LXm5Sr609cy3qOyxDLjY6Ht8uelukj2E5J2Lvr9U5Le7qAfS3L3t5vvpyU9p/FbivrUhyvoNt9Pd9yf3xunZbyXWmZcY3Dsulz+vItkf1nSHWb2aTNbKenLkvZ30I+PMbO1zQcnMrO1kj6v8VuKer+kPc3PeyQ932Ff/sC4LOPda5lxdXzsOl/+3N1H/iXpQS18Iv+mpH/qog89+vVnkv67+Xqt675JelYLL+uuauEV0aOSbpb0oqTXm++bx6hv/y7pVUmHtZBY2zvq219p4a3hYUmHmq8Huz52Qb9Gcty4XBaoBFfQAZUg2YFKkOxAJUh2oBIkO1AJkh2oBMkOVOL/Aaj9Ii47V1J2AAAAAElFTkSuQmCC\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "imshow(np.asarray(X_tilde[2]).reshape(28,28), cmap='gray')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Pull out the hidden representations (for first 5k points) and plot them." ] }, { "cell_type": "code", "execution_count": 199, "metadata": {}, "outputs": [], "source": [ "Zs = auto(X[:5000].float(), return_z=True).detach().numpy()" ] }, { "cell_type": "code", "execution_count": 200, "metadata": {}, "outputs": [], "source": [ "colors = ['r', 'g', 'b', 'c', 'm', 'y', 'k', 'w', 'orange', 'purple']\n", "c = [colors[y_i] for y_i in y[:5000]]" ] }, { "cell_type": "code", "execution_count": 201, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 201, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "plt.scatter(Zs[:,0], Zs[:,1], c=c)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Let's implement `AE2` extending the above by adding a non-linear activation function (try `Sigmoid`)." ] }, { "cell_type": "code", "execution_count": 202, "metadata": {}, "outputs": [], "source": [ "class AE2(nn.Module):\n", " \n", " def __init__(self, input_size=784, hidden_size=16):\n", " '''\n", " In the initializer we setup model parameters/layers.\n", " '''\n", " super(AE2, self).__init__() \n", "\n", " self.input_size = input_size\n", " self.hidden_size = hidden_size\n", " \n", " # input layer; from x -> z\n", " self.i = nn.Linear(self.input_size, self.hidden_size)\n", " \n", " self.a = nn.Sigmoid()\n", " \n", " # output layer\n", " self.o = nn.Linear(self.hidden_size, self.input_size)\n", " \n", "\n", " def forward(self, X, return_z=False):\n", " z = self.a(self.i(X))\n", " if return_z:\n", " return z\n", " return self.o(z)" ] }, { "cell_type": "code", "execution_count": 203, "metadata": {}, "outputs": [], "source": [ "auto2 = AE2()\n", "optimizer = optim.SGD(auto2.parameters(), lr=0.001, momentum=0.9)" ] }, { "cell_type": "code", "execution_count": 204, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "epoch: 0, batch: 0 // loss: 0.309\n", "epoch: 0, batch: 100 // loss: 0.292\n", "epoch: 0, batch: 200 // loss: 0.255\n", "epoch: 0, batch: 300 // loss: 0.236\n", "epoch: 0, batch: 400 // loss: 0.238\n", "epoch: 0, batch: 500 // loss: 0.233\n", "epoch: 0, batch: 600 // loss: 0.235\n", "epoch: 0, batch: 700 // loss: 0.242\n", "epoch: 0, batch: 800 // loss: 0.213\n", "epoch: 0, batch: 900 // loss: 0.255\n", "epoch: 0, batch: 1000 // loss: 0.230\n", "epoch: 0, batch: 1100 // loss: 0.260\n", "epoch: 0, batch: 1200 // loss: 0.204\n", "epoch: 0, batch: 1300 // loss: 0.248\n", "epoch: 0, batch: 1400 // loss: 0.205\n", "epoch: 0, batch: 1500 // loss: 0.204\n", "epoch: 0, batch: 1600 // loss: 0.234\n", "epoch: 0, batch: 1700 // loss: 0.219\n", "epoch: 0, batch: 1800 // loss: 0.253\n", "epoch: 0, batch: 1900 // loss: 0.223\n", "epoch: 0, batch: 2000 // loss: 0.197\n", "epoch: 0, batch: 2100 // loss: 0.197\n", "epoch: 0, batch: 2200 // loss: 0.244\n", "epoch: 0, batch: 2300 // loss: 0.216\n", "epoch: 0, batch: 2400 // loss: 0.168\n", "epoch: 0, batch: 2500 // loss: 0.184\n", "epoch: 0, batch: 2600 // loss: 0.233\n", "epoch: 0, batch: 2700 // loss: 0.183\n", "epoch: 0, batch: 2800 // loss: 0.236\n", "epoch: 0, batch: 2900 // loss: 0.172\n", "epoch: 0, batch: 3000 // loss: 0.190\n", "epoch: 0, batch: 3100 // loss: 0.226\n", "epoch: 0, batch: 3200 // loss: 0.164\n", "epoch: 0, batch: 3300 // loss: 0.192\n", "epoch: 0, batch: 3400 // loss: 0.194\n", "epoch: 0, batch: 3500 // loss: 0.205\n", "epoch: 0, batch: 3600 // loss: 0.203\n", "epoch: 0, batch: 3700 // loss: 0.224\n", "\n", "epoch: 1, batch: 0 // loss: 0.204\n", "epoch: 1, batch: 100 // loss: 0.213\n", "epoch: 1, batch: 200 // loss: 0.194\n", "epoch: 1, batch: 300 // loss: 0.182\n", "epoch: 1, batch: 400 // loss: 0.191\n", "epoch: 1, batch: 500 // loss: 0.189\n", "epoch: 1, batch: 600 // loss: 0.193\n", "epoch: 1, batch: 700 // loss: 0.201\n", "epoch: 1, batch: 800 // loss: 0.176\n", "epoch: 1, batch: 900 // loss: 0.217\n", "epoch: 1, batch: 1000 // loss: 0.193\n", "epoch: 1, batch: 1100 // loss: 0.222\n", "epoch: 1, batch: 1200 // loss: 0.171\n", "epoch: 1, batch: 1300 // loss: 0.212\n", "epoch: 1, batch: 1400 // loss: 0.172\n", "epoch: 1, batch: 1500 // loss: 0.172\n", "epoch: 1, batch: 1600 // loss: 0.199\n", "epoch: 1, batch: 1700 // loss: 0.186\n", "epoch: 1, batch: 1800 // loss: 0.217\n", "epoch: 1, batch: 1900 // loss: 0.189\n", "epoch: 1, batch: 2000 // loss: 0.166\n", "epoch: 1, batch: 2100 // loss: 0.167\n", "epoch: 1, batch: 2200 // loss: 0.209\n", "epoch: 1, batch: 2300 // loss: 0.184\n", "epoch: 1, batch: 2400 // loss: 0.141\n", "epoch: 1, batch: 2500 // loss: 0.154\n", "epoch: 1, batch: 2600 // loss: 0.198\n", "epoch: 1, batch: 2700 // loss: 0.154\n", "epoch: 1, batch: 2800 // loss: 0.201\n", "epoch: 1, batch: 2900 // loss: 0.145\n", "epoch: 1, batch: 3000 // loss: 0.160\n", "epoch: 1, batch: 3100 // loss: 0.191\n", "epoch: 1, batch: 3200 // loss: 0.138\n", "epoch: 1, batch: 3300 // loss: 0.161\n", "epoch: 1, batch: 3400 // loss: 0.162\n", "epoch: 1, batch: 3500 // loss: 0.171\n", "epoch: 1, batch: 3600 // loss: 0.171\n", "epoch: 1, batch: 3700 // loss: 0.189\n", "\n", "epoch: 2, batch: 0 // loss: 0.174\n", "epoch: 2, batch: 100 // loss: 0.178\n", "epoch: 2, batch: 200 // loss: 0.163\n", "epoch: 2, batch: 300 // loss: 0.153\n", "epoch: 2, batch: 400 // loss: 0.160\n", "epoch: 2, batch: 500 // loss: 0.156\n", "epoch: 2, batch: 600 // loss: 0.160\n", "epoch: 2, batch: 700 // loss: 0.167\n", "epoch: 2, batch: 800 // loss: 0.147\n", "epoch: 2, batch: 900 // loss: 0.181\n", "epoch: 2, batch: 1000 // loss: 0.158\n", "epoch: 2, batch: 1100 // loss: 0.183\n", "epoch: 2, batch: 1200 // loss: 0.143\n", "epoch: 2, batch: 1300 // loss: 0.176\n", "epoch: 2, batch: 1400 // loss: 0.142\n", "epoch: 2, batch: 1500 // loss: 0.142\n", "epoch: 2, batch: 1600 // loss: 0.164\n", "epoch: 2, batch: 1700 // loss: 0.153\n", "epoch: 2, batch: 1800 // loss: 0.178\n", "epoch: 2, batch: 1900 // loss: 0.155\n", "epoch: 2, batch: 2000 // loss: 0.136\n", "epoch: 2, batch: 2100 // loss: 0.139\n", "epoch: 2, batch: 2200 // loss: 0.172\n", "epoch: 2, batch: 2300 // loss: 0.152\n", "epoch: 2, batch: 2400 // loss: 0.116\n", "epoch: 2, batch: 2500 // loss: 0.126\n", "epoch: 2, batch: 2600 // loss: 0.161\n", "epoch: 2, batch: 2700 // loss: 0.125\n", "epoch: 2, batch: 2800 // loss: 0.165\n", "epoch: 2, batch: 2900 // loss: 0.118\n", "epoch: 2, batch: 3000 // loss: 0.130\n", "epoch: 2, batch: 3100 // loss: 0.154\n", "epoch: 2, batch: 3200 // loss: 0.113\n", "epoch: 2, batch: 3300 // loss: 0.129\n", "epoch: 2, batch: 3400 // loss: 0.130\n", "epoch: 2, batch: 3500 // loss: 0.137\n", "epoch: 2, batch: 3600 // loss: 0.139\n", "epoch: 2, batch: 3700 // loss: 0.153\n", "\n", "epoch: 3, batch: 0 // loss: 0.144\n", "epoch: 3, batch: 100 // loss: 0.143\n", "epoch: 3, batch: 200 // loss: 0.134\n", "epoch: 3, batch: 300 // loss: 0.126\n", "epoch: 3, batch: 400 // loss: 0.130\n", "epoch: 3, batch: 500 // loss: 0.125\n", "epoch: 3, batch: 600 // loss: 0.127\n", "epoch: 3, batch: 700 // loss: 0.133\n", "epoch: 3, batch: 800 // loss: 0.120\n", "epoch: 3, batch: 900 // loss: 0.147\n", "epoch: 3, batch: 1000 // loss: 0.125\n", "epoch: 3, batch: 1100 // loss: 0.145\n", "epoch: 3, batch: 1200 // loss: 0.116\n", "epoch: 3, batch: 1300 // loss: 0.141\n", "epoch: 3, batch: 1400 // loss: 0.114\n", "epoch: 3, batch: 1500 // loss: 0.115\n", "epoch: 3, batch: 1600 // loss: 0.132\n", "epoch: 3, batch: 1700 // loss: 0.124\n", "epoch: 3, batch: 1800 // loss: 0.142\n", "epoch: 3, batch: 1900 // loss: 0.125\n", "epoch: 3, batch: 2000 // loss: 0.110\n", "epoch: 3, batch: 2100 // loss: 0.115\n", "epoch: 3, batch: 2200 // loss: 0.139\n", "epoch: 3, batch: 2300 // loss: 0.123\n", "epoch: 3, batch: 2400 // loss: 0.096\n", "epoch: 3, batch: 2500 // loss: 0.102\n", "epoch: 3, batch: 2600 // loss: 0.129\n", "epoch: 3, batch: 2700 // loss: 0.101\n", "epoch: 3, batch: 2800 // loss: 0.133\n", "epoch: 3, batch: 2900 // loss: 0.096\n", "epoch: 3, batch: 3000 // loss: 0.106\n", "epoch: 3, batch: 3100 // loss: 0.122\n", "epoch: 3, batch: 3200 // loss: 0.094\n", "epoch: 3, batch: 3300 // loss: 0.104\n", "epoch: 3, batch: 3400 // loss: 0.103\n", "epoch: 3, batch: 3500 // loss: 0.109\n", "epoch: 3, batch: 3600 // loss: 0.114\n", "epoch: 3, batch: 3700 // loss: 0.124\n", "\n", "epoch: 4, batch: 0 // loss: 0.120\n", "epoch: 4, batch: 100 // loss: 0.115\n", "epoch: 4, batch: 200 // loss: 0.112\n", "epoch: 4, batch: 300 // loss: 0.105\n", "epoch: 4, batch: 400 // loss: 0.108\n", "epoch: 4, batch: 500 // loss: 0.101\n", "epoch: 4, batch: 600 // loss: 0.103\n", "epoch: 4, batch: 700 // loss: 0.108\n", "epoch: 4, batch: 800 // loss: 0.101\n", "epoch: 4, batch: 900 // loss: 0.121\n", "epoch: 4, batch: 1000 // loss: 0.100\n", "epoch: 4, batch: 1100 // loss: 0.117\n", "epoch: 4, batch: 1200 // loss: 0.097\n", "epoch: 4, batch: 1300 // loss: 0.116\n", "epoch: 4, batch: 1400 // loss: 0.095\n", "epoch: 4, batch: 1500 // loss: 0.096\n", "epoch: 4, batch: 1600 // loss: 0.109\n", "epoch: 4, batch: 1700 // loss: 0.104\n", "epoch: 4, batch: 1800 // loss: 0.116\n", "epoch: 4, batch: 1900 // loss: 0.104\n", "epoch: 4, batch: 2000 // loss: 0.092\n", "epoch: 4, batch: 2100 // loss: 0.098\n", "epoch: 4, batch: 2200 // loss: 0.117\n", "epoch: 4, batch: 2300 // loss: 0.104\n", "epoch: 4, batch: 2400 // loss: 0.084\n", "epoch: 4, batch: 2500 // loss: 0.086\n", "epoch: 4, batch: 2600 // loss: 0.108\n", "epoch: 4, batch: 2700 // loss: 0.086\n", "epoch: 4, batch: 2800 // loss: 0.112\n", "epoch: 4, batch: 2900 // loss: 0.082\n", "epoch: 4, batch: 3000 // loss: 0.090\n", "epoch: 4, batch: 3100 // loss: 0.102\n", "epoch: 4, batch: 3200 // loss: 0.082\n", "epoch: 4, batch: 3300 // loss: 0.088\n", "epoch: 4, batch: 3400 // loss: 0.086\n", "epoch: 4, batch: 3500 // loss: 0.091\n", "epoch: 4, batch: 3600 // loss: 0.098\n", "epoch: 4, batch: 3700 // loss: 0.105\n", "\n", "epoch: 5, batch: 0 // loss: 0.105\n", "epoch: 5, batch: 100 // loss: 0.098\n", "epoch: 5, batch: 200 // loss: 0.098\n", "epoch: 5, batch: 300 // loss: 0.092\n", "epoch: 5, batch: 400 // loss: 0.094\n", "epoch: 5, batch: 500 // loss: 0.086\n", "epoch: 5, batch: 600 // loss: 0.089\n", "epoch: 5, batch: 700 // loss: 0.093\n", "epoch: 5, batch: 800 // loss: 0.089\n", "epoch: 5, batch: 900 // loss: 0.105\n", "epoch: 5, batch: 1000 // loss: 0.086\n", "epoch: 5, batch: 1100 // loss: 0.099\n", "epoch: 5, batch: 1200 // loss: 0.087\n", "epoch: 5, batch: 1300 // loss: 0.100\n", "epoch: 5, batch: 1400 // loss: 0.084\n", "epoch: 5, batch: 1500 // loss: 0.086\n", "epoch: 5, batch: 1600 // loss: 0.095\n", "epoch: 5, batch: 1700 // loss: 0.092\n", "epoch: 5, batch: 1800 // loss: 0.100\n", "epoch: 5, batch: 1900 // loss: 0.091\n", "epoch: 5, batch: 2000 // loss: 0.083\n", "epoch: 5, batch: 2100 // loss: 0.089\n", "epoch: 5, batch: 2200 // loss: 0.103\n", "epoch: 5, batch: 2300 // loss: 0.093\n", "epoch: 5, batch: 2400 // loss: 0.078\n", "epoch: 5, batch: 2500 // loss: 0.078\n", "epoch: 5, batch: 2600 // loss: 0.095\n", "epoch: 5, batch: 2700 // loss: 0.078\n", "epoch: 5, batch: 2800 // loss: 0.099\n", "epoch: 5, batch: 2900 // loss: 0.075\n", "epoch: 5, batch: 3000 // loss: 0.081\n", "epoch: 5, batch: 3100 // loss: 0.090\n", "epoch: 5, batch: 3200 // loss: 0.076\n", "epoch: 5, batch: 3300 // loss: 0.079\n", "epoch: 5, batch: 3400 // loss: 0.077\n", "epoch: 5, batch: 3500 // loss: 0.081\n", "epoch: 5, batch: 3600 // loss: 0.089\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 5, batch: 3700 // loss: 0.094\n", "\n", "epoch: 6, batch: 0 // loss: 0.097\n", "epoch: 6, batch: 100 // loss: 0.088\n", "epoch: 6, batch: 200 // loss: 0.091\n", "epoch: 6, batch: 300 // loss: 0.085\n", "epoch: 6, batch: 400 // loss: 0.087\n", "epoch: 6, batch: 500 // loss: 0.078\n", "epoch: 6, batch: 600 // loss: 0.080\n", "epoch: 6, batch: 700 // loss: 0.084\n", "epoch: 6, batch: 800 // loss: 0.083\n", "epoch: 6, batch: 900 // loss: 0.096\n", "epoch: 6, batch: 1000 // loss: 0.077\n", "epoch: 6, batch: 1100 // loss: 0.089\n", "epoch: 6, batch: 1200 // loss: 0.081\n", "epoch: 6, batch: 1300 // loss: 0.092\n", "epoch: 6, batch: 1400 // loss: 0.078\n", "epoch: 6, batch: 1500 // loss: 0.081\n", "epoch: 6, batch: 1600 // loss: 0.088\n", "epoch: 6, batch: 1700 // loss: 0.085\n", "epoch: 6, batch: 1800 // loss: 0.092\n", "epoch: 6, batch: 1900 // loss: 0.085\n", "epoch: 6, batch: 2000 // loss: 0.078\n", "epoch: 6, batch: 2100 // loss: 0.085\n", "epoch: 6, batch: 2200 // loss: 0.096\n", "epoch: 6, batch: 2300 // loss: 0.087\n", "epoch: 6, batch: 2400 // loss: 0.075\n", "epoch: 6, batch: 2500 // loss: 0.073\n", "epoch: 6, batch: 2600 // loss: 0.088\n", "epoch: 6, batch: 2700 // loss: 0.073\n", "epoch: 6, batch: 2800 // loss: 0.092\n", "epoch: 6, batch: 2900 // loss: 0.071\n", "epoch: 6, batch: 3000 // loss: 0.077\n", "epoch: 6, batch: 3100 // loss: 0.083\n", "epoch: 6, batch: 3200 // loss: 0.073\n", "epoch: 6, batch: 3300 // loss: 0.075\n", "epoch: 6, batch: 3400 // loss: 0.072\n", "epoch: 6, batch: 3500 // loss: 0.076\n", "epoch: 6, batch: 3600 // loss: 0.084\n", "epoch: 6, batch: 3700 // loss: 0.088\n", "\n", "epoch: 7, batch: 0 // loss: 0.092\n", "epoch: 7, batch: 100 // loss: 0.083\n", "epoch: 7, batch: 200 // loss: 0.086\n", "epoch: 7, batch: 300 // loss: 0.082\n", "epoch: 7, batch: 400 // loss: 0.083\n", "epoch: 7, batch: 500 // loss: 0.073\n", "epoch: 7, batch: 600 // loss: 0.076\n", "epoch: 7, batch: 700 // loss: 0.079\n", "epoch: 7, batch: 800 // loss: 0.080\n", "epoch: 7, batch: 900 // loss: 0.090\n", "epoch: 7, batch: 1000 // loss: 0.073\n", "epoch: 7, batch: 1100 // loss: 0.083\n", "epoch: 7, batch: 1200 // loss: 0.079\n", "epoch: 7, batch: 1300 // loss: 0.087\n", "epoch: 7, batch: 1400 // loss: 0.075\n", "epoch: 7, batch: 1500 // loss: 0.078\n", "epoch: 7, batch: 1600 // loss: 0.084\n", "epoch: 7, batch: 1700 // loss: 0.081\n", "epoch: 7, batch: 1800 // loss: 0.087\n", "epoch: 7, batch: 1900 // loss: 0.081\n", "epoch: 7, batch: 2000 // loss: 0.075\n", "epoch: 7, batch: 2100 // loss: 0.083\n", "epoch: 7, batch: 2200 // loss: 0.091\n", "epoch: 7, batch: 2300 // loss: 0.084\n", "epoch: 7, batch: 2400 // loss: 0.073\n", "epoch: 7, batch: 2500 // loss: 0.071\n", "epoch: 7, batch: 2600 // loss: 0.084\n", "epoch: 7, batch: 2700 // loss: 0.071\n", "epoch: 7, batch: 2800 // loss: 0.088\n", "epoch: 7, batch: 2900 // loss: 0.069\n", "epoch: 7, batch: 3000 // loss: 0.074\n", "epoch: 7, batch: 3100 // loss: 0.079\n", "epoch: 7, batch: 3200 // loss: 0.072\n", "epoch: 7, batch: 3300 // loss: 0.072\n", "epoch: 7, batch: 3400 // loss: 0.069\n", "epoch: 7, batch: 3500 // loss: 0.072\n", "epoch: 7, batch: 3600 // loss: 0.081\n", "epoch: 7, batch: 3700 // loss: 0.085\n", "\n", "epoch: 8, batch: 0 // loss: 0.089\n", "epoch: 8, batch: 100 // loss: 0.080\n", "epoch: 8, batch: 200 // loss: 0.084\n", "epoch: 8, batch: 300 // loss: 0.080\n", "epoch: 8, batch: 400 // loss: 0.081\n", "epoch: 8, batch: 500 // loss: 0.071\n", "epoch: 8, batch: 600 // loss: 0.073\n", "epoch: 8, batch: 700 // loss: 0.076\n", "epoch: 8, batch: 800 // loss: 0.078\n", "epoch: 8, batch: 900 // loss: 0.087\n", "epoch: 8, batch: 1000 // loss: 0.070\n", "epoch: 8, batch: 1100 // loss: 0.079\n", "epoch: 8, batch: 1200 // loss: 0.077\n", "epoch: 8, batch: 1300 // loss: 0.084\n", "epoch: 8, batch: 1400 // loss: 0.074\n", "epoch: 8, batch: 1500 // loss: 0.077\n", "epoch: 8, batch: 1600 // loss: 0.081\n", "epoch: 8, batch: 1700 // loss: 0.079\n", "epoch: 8, batch: 1800 // loss: 0.084\n", "epoch: 8, batch: 1900 // loss: 0.079\n", "epoch: 8, batch: 2000 // loss: 0.074\n", "epoch: 8, batch: 2100 // loss: 0.081\n", "epoch: 8, batch: 2200 // loss: 0.089\n", "epoch: 8, batch: 2300 // loss: 0.082\n", "epoch: 8, batch: 2400 // loss: 0.072\n", "epoch: 8, batch: 2500 // loss: 0.070\n", "epoch: 8, batch: 2600 // loss: 0.081\n", "epoch: 8, batch: 2700 // loss: 0.070\n", "epoch: 8, batch: 2800 // loss: 0.085\n", "epoch: 8, batch: 2900 // loss: 0.068\n", "epoch: 8, batch: 3000 // loss: 0.072\n", "epoch: 8, batch: 3100 // loss: 0.077\n", "epoch: 8, batch: 3200 // loss: 0.071\n", "epoch: 8, batch: 3300 // loss: 0.070\n", "epoch: 8, batch: 3400 // loss: 0.068\n", "epoch: 8, batch: 3500 // loss: 0.070\n", "epoch: 8, batch: 3600 // loss: 0.079\n", "epoch: 8, batch: 3700 // loss: 0.082\n", "\n", "epoch: 9, batch: 0 // loss: 0.088\n", "epoch: 9, batch: 100 // loss: 0.078\n", "epoch: 9, batch: 200 // loss: 0.082\n", "epoch: 9, batch: 300 // loss: 0.079\n", "epoch: 9, batch: 400 // loss: 0.079\n", "epoch: 9, batch: 500 // loss: 0.069\n", "epoch: 9, batch: 600 // loss: 0.071\n", "epoch: 9, batch: 700 // loss: 0.074\n", "epoch: 9, batch: 800 // loss: 0.077\n", "epoch: 9, batch: 900 // loss: 0.085\n", "epoch: 9, batch: 1000 // loss: 0.069\n", "epoch: 9, batch: 1100 // loss: 0.077\n", "epoch: 9, batch: 1200 // loss: 0.076\n", "epoch: 9, batch: 1300 // loss: 0.082\n", "epoch: 9, batch: 1400 // loss: 0.072\n", "epoch: 9, batch: 1500 // loss: 0.076\n", "epoch: 9, batch: 1600 // loss: 0.080\n", "epoch: 9, batch: 1700 // loss: 0.077\n", "epoch: 9, batch: 1800 // loss: 0.082\n", "epoch: 9, batch: 1900 // loss: 0.077\n", "epoch: 9, batch: 2000 // loss: 0.073\n", "epoch: 9, batch: 2100 // loss: 0.080\n", "epoch: 9, batch: 2200 // loss: 0.087\n", "epoch: 9, batch: 2300 // loss: 0.080\n", "epoch: 9, batch: 2400 // loss: 0.072\n", "epoch: 9, batch: 2500 // loss: 0.069\n", "epoch: 9, batch: 2600 // loss: 0.079\n", "epoch: 9, batch: 2700 // loss: 0.069\n", "epoch: 9, batch: 2800 // loss: 0.084\n", "epoch: 9, batch: 2900 // loss: 0.068\n", "epoch: 9, batch: 3000 // loss: 0.071\n", "epoch: 9, batch: 3100 // loss: 0.075\n", "epoch: 9, batch: 3200 // loss: 0.071\n", "epoch: 9, batch: 3300 // loss: 0.069\n", "epoch: 9, batch: 3400 // loss: 0.067\n", "epoch: 9, batch: 3500 // loss: 0.068\n", "epoch: 9, batch: 3600 // loss: 0.077\n", "epoch: 9, batch: 3700 // loss: 0.081\n" ] } ], "source": [ "train_AE(X, X, auto2, optimizer, loss_function)" ] }, { "cell_type": "code", "execution_count": 205, "metadata": {}, "outputs": [], "source": [ "Zs = auto2(X[:5000].float(), return_z=True).detach().numpy()" ] }, { "cell_type": "code", "execution_count": 206, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 206, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "plt.scatter(Zs[:,0], Zs[:,1], c=c)" ] }, { "cell_type": "code", "execution_count": 207, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "(5000, 16)" ] }, "execution_count": 207, "metadata": {}, "output_type": "execute_result" } ], "source": [ "Zs.shape" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### TODO 3\n", "\n", "*Denoising* auto-encoder. Now let's take as our target *corrupted* versions of the inputs. To create a corrupt version we will perturb the input pixel values by some random noise." ] }, { "cell_type": "code", "execution_count": 208, "metadata": {}, "outputs": [], "source": [ "def corrupt(x, var=0.01):\n", " return x + np.random.normal(np.zeros(x.shape), var)" ] }, { "cell_type": "code", "execution_count": 209, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "tensor([0., 0., 0., 0., 0., 0., 0., 0., 0., 0.], dtype=torch.float64)" ] }, "execution_count": 209, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X[0,:10]" ] }, { "cell_type": "code", "execution_count": 210, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "tensor([ 0.0073, 0.0166, -0.0076, 0.0072, 0.0170, 0.0171, 0.0167, 0.0069,\n", " 0.0050, 0.0150], dtype=torch.float64)" ] }, "execution_count": 210, "metadata": {}, "output_type": "execute_result" } ], "source": [ "corrupt(X[0])[:10]" ] }, { "cell_type": "code", "execution_count": 211, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 211, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAPsAAAD4CAYAAAAq5pAIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAAR1ElEQVR4nO3dbYyV5ZkH8P9fXlRe5EVEhpcIVoxsNi6sIxpBU60Q9INQtVg+NBh1aUxN2qQma9wPNfGDRLdt9gNpMlVTunZtmhQixrcS0sRuwMpIWECmrYBYBsYBBIHhbRi49sM8mCnOc13jec45z5H7/0vIzJxr7nPuc878OWfmeu7npplBRC5+l5Q9ARGpD4VdJBEKu0giFHaRRCjsIokYXM8bI6k//YvUmJmxv8sLvbKTXEDyryR3kHyqyHWJSG2x0j47yUEA/gZgHoB2ABsBLDGz7c4YvbKL1FgtXtlnA9hhZrvMrBvAbwEsLHB9IlJDRcI+CcCePl+3Z5f9A5LLSLaSbC1wWyJSUJE/0PX3VuFLb9PNrAVAC6C38SJlKvLK3g5gSp+vJwPYV2w6IlIrRcK+EcB0ktNIDgXwXQBrqjMtEam2it/Gm1kPyScAvANgEICXzezDqs1MRKqq4tZbRTem39lFaq4mB9WIyNeHwi6SCIVdJBEKu0giFHaRRCjsIolQ2EUSobCLJEJhF0mEwi6SCIVdJBEKu0giFHaRRNT1VNJSf2S/C6C+UHTV48iRI9363Llzc2tvvfVWoduO7tugQYNyaz09PYVuu6ho7p5KnzO9soskQmEXSYTCLpIIhV0kEQq7SCIUdpFEKOwiiVCf/SJ3ySX+/+dnz55169ddd51bf+yxx9z6yZMnc2vHjx93x546dcqtv//++269SC896oNHj2s0vsjcvOMHvOdTr+wiiVDYRRKhsIskQmEXSYTCLpIIhV0kEQq7SCLUZ7/IeT1ZIO6z33XXXW797rvvduvt7e25tUsvvdQdO2zYMLc+b948t/7iiy/m1jo7O92x0Zrx6HGLjBgxIrd27tw5d+yJEycqus1CYSe5G8AxAGcB9JhZc5HrE5HaqcYr+51mdrAK1yMiNaTf2UUSUTTsBuAPJD8guay/byC5jGQrydaCtyUiBRR9Gz/HzPaRHA9gLcm/mNm7fb/BzFoAtAAAyWJnNxSRihV6ZTezfdnH/QBWA5hdjUmJSPVVHHaSw0mOPP85gPkAtlVrYiJSXUXexl8NYHW2bncwgP8xs7erMiupmu7u7kLjb775Zrc+depUt+71+aM14e+8845bnzVrllt//vnnc2utrf6fkLZu3erW29ra3Prs2f6bXO9xXb9+vTt2w4YNubWurq7cWsVhN7NdAP6l0vEiUl9qvYkkQmEXSYTCLpIIhV0kEQq7SCJYdMver3RjOoKuJrzTFkfPb7RM1GtfAcDo0aPd+pkzZ3Jr0VLOyMaNG936jh07cmtFW5JNTU1u3bvfgD/3Bx980B27YsWK3FprayuOHj3a7w+EXtlFEqGwiyRCYRdJhMIukgiFXSQRCrtIIhR2kUSoz94Aou19i4ie3/fee8+tR0tYI959i7YtLtoL97Z8jnr8mzZtcuteDx+I79uCBQtya9dee607dtKkSW7dzNRnF0mZwi6SCIVdJBEKu0giFHaRRCjsIolQ2EUSoS2bG0A9j3W40OHDh916tG775MmTbt3blnnwYP/Hz9vWGPD76ABw+eWX59aiPvvtt9/u1m+77Ta3Hp0me/z48bm1t9+uzRnZ9coukgiFXSQRCrtIIhR2kUQo7CKJUNhFEqGwiyRCffbEDRs2zK1H/eKofuLEidzakSNH3LGfffaZW4/W2nvHL0TnEIjuV/S4nT171q17ff4pU6a4YysVvrKTfJnkfpLb+lw2luRakh9lH8fUZHYiUjUDeRv/KwAXnlbjKQDrzGw6gHXZ1yLSwMKwm9m7AA5dcPFCACuzz1cCWFTleYlIlVX6O/vVZtYBAGbWQTL3QF+SywAsq/B2RKRKav4HOjNrAdAC6ISTImWqtPXWSbIJALKP+6s3JRGphUrDvgbA0uzzpQBeq850RKRWwrfxJF8F8E0A40i2A/gJgOUAfkfyUQB/B/CdWk7yYle05+v1dKM14RMnTnTrp0+fLlT31rNH54X3evRAvDe816eP+uRDhw5168eOHXPro0aNcutbtmzJrUXPWXNzc25t+/btubUw7Ga2JKf0rWisiDQOHS4rkgiFXSQRCrtIIhR2kUQo7CKJ0BLXBhCdSnrQoEFu3Wu9PfTQQ+7YCRMmuPUDBw64de90zYC/lHP48OHu2GipZ9S689p+Z86cccdGp7mO7veVV17p1lesWJFbmzlzpjvWm5vXxtUru0giFHaRRCjsIolQ2EUSobCLJEJhF0mEwi6SCNZzu2CdqaZ/UU+3p6en4uu+5ZZb3Pobb7zh1qMtmYscAzBy5Eh3bLQlc3Sq6SFDhlRUA+JjAKKtriPefXvhhRfcsa+88opbN7N+m+16ZRdJhMIukgiFXSQRCrtIIhR2kUQo7CKJUNhFEvG1Ws/urdWN+r3R6Zij0zl765+9NdsDUaSPHnnzzTfd+vHjx9161GePTrnsHccRrZWPntPLLrvMrUdr1ouMjZ7zaO433nhjbi3ayrpSemUXSYTCLpIIhV0kEQq7SCIUdpFEKOwiiVDYRRLRUH32Imuja9mrrrU77rjDrT/wwANufc6cObm1aNvjaE141EeP1uJ7z1k0t+jnwTsvPOD34aPzOERzi0SPW1dXV27t/vvvd8e+/vrrFc0pfGUn+TLJ/SS39bnsGZJ7SW7O/t1b0a2LSN0M5G38rwAs6Ofyn5vZzOyff5iWiJQuDLuZvQvgUB3mIiI1VOQPdE+Q3JK9zR+T900kl5FsJdla4LZEpKBKw/4LAN8AMBNAB4Cf5n2jmbWYWbOZNVd4WyJSBRWF3cw6zeysmZ0D8EsAs6s7LRGptorCTrKpz5ffBrAt73tFpDGE540n+SqAbwIYB6ATwE+yr2cCMAC7AXzfzDrCGyvxvPFjx4516xMnTnTr06dPr3hs1De9/vrr3frp06fdurdWP1qXHe0zvm/fPrcenX/d6zdHe5hH+68PGzbMra9fvz63NmLECHdsdOxDtJ49WpPuPW6dnZ3u2BkzZrj1vPPGhwfVmNmSfi5+KRonIo1Fh8uKJEJhF0mEwi6SCIVdJBEKu0giGmrL5ltvvdUd/+yzz+bWrrrqKnfs6NGj3bq3FBPwl1t+/vnn7tho+W3UQopaUN5psKNTQbe1tbn1xYsXu/XWVv8oaG9b5jFjco+yBgBMnTrVrUd27dqVW4u2iz527Jhbj5bARi1Nr/V3xRVXuGOjnxdt2SySOIVdJBEKu0giFHaRRCjsIolQ2EUSobCLJKLufXavX71hwwZ3fFNTU24t6pNH9SKnDo5OeRz1uosaNWpUbm3cuHHu2Icfftitz58/360//vjjbt1bInvq1Cl37Mcff+zWvT464C9LLrq8NlraG/XxvfHR8tlrrrnGravPLpI4hV0kEQq7SCIUdpFEKOwiiVDYRRKhsIskoq599nHjxtl9992XW1++fLk7fufOnbm16NTAUT3a/tcT9Vy9PjgA7Nmzx61Hp3P21vJ7p5kGgAkTJrj1RYsWuXVvW2TAX5MePSc33XRTobp336M+evS4RVsyR7xzEEQ/T955Hz799FN0d3erzy6SMoVdJBEKu0giFHaRRCjsIolQ2EUSobCLJCLcxbWaenp6sH///tx61G/21ghH2xpH1x31fL2+anSe70OHDrn1Tz75xK1Hc/PWy0drxqNz2q9evdqtb9261a17ffZoG+2oFx6dr9/brjq639Ga8qgXHo33+uxRD9/b4tt7TMJXdpJTSP6RZBvJD0n+MLt8LMm1JD/KPvpn/BeRUg3kbXwPgB+b2QwAtwL4Acl/AvAUgHVmNh3AuuxrEWlQYdjNrMPMNmWfHwPQBmASgIUAVmbfthKAf1yliJTqK/2BjuRUALMA/BnA1WbWAfT+hwBgfM6YZSRbSbZGv4OJSO0MOOwkRwD4PYAfmdnRgY4zsxYzazaz5qKLB0SkcgMKO8kh6A36b8xsVXZxJ8mmrN4EIP/P7CJSurD1xt4ewUsA2szsZ31KawAsBbA8+/hadF3d3d3Yu3dvbj1abtve3p5bGz58uDs2OqVy1MY5ePBgbu3AgQPu2MGD/Yc5Wl4btXm8ZabRKY2jpZze/QaAGTNmuPXjx4/n1qJ26OHDh9169Lh5c/fackDcmovGR1s2e0uLjxw54o6dOXNmbm3btm25tYH02ecA+B6ArSQ3Z5c9jd6Q/47kowD+DuA7A7guESlJGHYz+18AeUcAfKu60xGRWtHhsiKJUNhFEqGwiyRCYRdJhMIukoi6LnE9efIkNm/enFtftWpVbg0AHnnkkdxadLrlaHvfaCmot8w06oNHPdfoyMJoS2hveW+0VXV0bEO0lXVHR0fF1x/NLTo+ochzVnT5bJHltYDfx582bZo7trOzs6Lb1Su7SCIUdpFEKOwiiVDYRRKhsIskQmEXSYTCLpKIum7ZTLLQjd1zzz25tSeffNIdO358v2fN+kK0btvrq0b94qhPHvXZo36zd/3eKYuBuM8eHUMQ1b37Fo2N5h7xxnu96oGInrPoVNLeevYtW7a4YxcvXuzWzUxbNoukTGEXSYTCLpIIhV0kEQq7SCIUdpFEKOwiiah7n907T3nUmyzizjvvdOvPPfecW/f69KNGjXLHRudmj/rwUZ896vN7vC20gbgP7+0DAPjPaVdXlzs2elwi3tyj9ebROv7oOV27dq1bb2try62tX7/eHRtRn10kcQq7SCIUdpFEKOwiiVDYRRKhsIskQmEXSUTYZyc5BcCvAUwAcA5Ai5n9F8lnAPwbgPObkz9tZm8G11W/pn4d3XDDDW696N7wkydPduu7d+/OrUX95J07d7p1+frJ67MPZJOIHgA/NrNNJEcC+IDk+SMGfm5m/1mtSYpI7Qxkf/YOAB3Z58dItgGYVOuJiUh1faXf2UlOBTALwJ+zi54guYXkyyTH5IxZRrKVZGuhmYpIIQMOO8kRAH4P4EdmdhTALwB8A8BM9L7y/7S/cWbWYmbNZtZchfmKSIUGFHaSQ9Ab9N+Y2SoAMLNOMztrZucA/BLA7NpNU0SKCsPO3lN0vgSgzcx+1ufypj7f9m0A26o/PRGploG03uYC+BOArehtvQHA0wCWoPctvAHYDeD72R/zvOu6KFtvIo0kr/X2tTpvvIjEtJ5dJHEKu0giFHaRRCjsIolQ2EUSobCLJEJhF0mEwi6SCIVdJBEKu0giFHaRRCjsIolQ2EUSobCLJGIgZ5etpoMAPunz9bjsskbUqHNr1HkBmlulqjm3a/IKdV3P/qUbJ1sb9dx0jTq3Rp0XoLlVql5z09t4kUQo7CKJKDvsLSXfvqdR59ao8wI0t0rVZW6l/s4uIvVT9iu7iNSJwi6SiFLCTnIByb+S3EHyqTLmkIfkbpJbSW4ue3+6bA+9/SS39blsLMm1JD/KPva7x15Jc3uG5N7ssdtM8t6S5jaF5B9JtpH8kOQPs8tLfeycedXlcav77+wkBwH4G4B5ANoBbASwxMy213UiOUjuBtBsZqUfgEHyDgBdAH5tZv+cXfY8gENmtjz7j3KMmf17g8ztGQBdZW/jne1W1NR3m3EAiwA8jBIfO2dei1GHx62MV/bZAHaY2S4z6wbwWwALS5hHwzOzdwEcuuDihQBWZp+vRO8PS93lzK0hmFmHmW3KPj8G4Pw246U+ds686qKMsE8CsKfP1+1orP3eDcAfSH5AclnZk+nH1ee32co+ji95PhcKt/Gupwu2GW+Yx66S7c+LKiPs/W1N00j9vzlm9q8A7gHwg+ztqgzMgLbxrpd+thlvCJVuf15UGWFvBzClz9eTAewrYR79MrN92cf9AFaj8bai7jy/g272cX/J8/lCI23j3d8242iAx67M7c/LCPtGANNJTiM5FMB3AawpYR5fQnJ49ocTkBwOYD4abyvqNQCWZp8vBfBaiXP5B42yjXfeNuMo+bErfftzM6v7PwD3ovcv8jsB/EcZc8iZ17UA/i/792HZcwPwKnrf1p1B7zuiRwFcCWAdgI+yj2MbaG7/jd6tvbegN1hNJc1tLnp/NdwCYHP2796yHztnXnV53HS4rEgidASdSCIUdpFEKOwiiVDYRRKhsIskQmEXSYTCLpKI/wfWXDGbEgNvhQAAAABJRU5ErkJggg==\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "imshow(np.asarray(X[0].reshape((28,28))), cmap='gray')" ] }, { "cell_type": "code", "execution_count": 212, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 212, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "imshow(np.asarray(corrupt(X[0], var=0.1).reshape((28,28))), cmap='gray')" ] }, { "cell_type": "code", "execution_count": 213, "metadata": {}, "outputs": [], "source": [ "X_corrupt = corrupt(X)" ] }, { "cell_type": "code", "execution_count": 214, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "epoch: 0, batch: 0 // loss: 0.306\n", "epoch: 0, batch: 100 // loss: 0.235\n", "epoch: 0, batch: 200 // loss: 0.204\n", "epoch: 0, batch: 300 // loss: 0.184\n", "epoch: 0, batch: 400 // loss: 0.186\n", "epoch: 0, batch: 500 // loss: 0.175\n", "epoch: 0, batch: 600 // loss: 0.171\n", "epoch: 0, batch: 700 // loss: 0.168\n", "epoch: 0, batch: 800 // loss: 0.141\n", "epoch: 0, batch: 900 // loss: 0.162\n", "epoch: 0, batch: 1000 // loss: 0.131\n", "epoch: 0, batch: 1100 // loss: 0.140\n", "epoch: 0, batch: 1200 // loss: 0.108\n", "epoch: 0, batch: 1300 // loss: 0.120\n", "epoch: 0, batch: 1400 // loss: 0.095\n", "epoch: 0, batch: 1500 // loss: 0.092\n", "epoch: 0, batch: 1600 // loss: 0.097\n", "epoch: 0, batch: 1700 // loss: 0.090\n", "epoch: 0, batch: 1800 // loss: 0.095\n", "epoch: 0, batch: 1900 // loss: 0.086\n", "epoch: 0, batch: 2000 // loss: 0.077\n", "epoch: 0, batch: 2100 // loss: 0.084\n", "epoch: 0, batch: 2200 // loss: 0.091\n", "epoch: 0, batch: 2300 // loss: 0.083\n", "epoch: 0, batch: 2400 // loss: 0.073\n", "epoch: 0, batch: 2500 // loss: 0.070\n", "epoch: 0, batch: 2600 // loss: 0.080\n", "epoch: 0, batch: 2700 // loss: 0.070\n", "epoch: 0, batch: 2800 // loss: 0.084\n", "epoch: 0, batch: 2900 // loss: 0.068\n", "epoch: 0, batch: 3000 // loss: 0.070\n", "epoch: 0, batch: 3100 // loss: 0.075\n", "epoch: 0, batch: 3200 // loss: 0.071\n", "epoch: 0, batch: 3300 // loss: 0.068\n", "epoch: 0, batch: 3400 // loss: 0.066\n", "epoch: 0, batch: 3500 // loss: 0.067\n", "epoch: 0, batch: 3600 // loss: 0.076\n", "epoch: 0, batch: 3700 // loss: 0.079\n", "\n", "epoch: 1, batch: 0 // loss: 0.085\n", "epoch: 1, batch: 100 // loss: 0.074\n", "epoch: 1, batch: 200 // loss: 0.078\n", "epoch: 1, batch: 300 // loss: 0.077\n", "epoch: 1, batch: 400 // loss: 0.076\n", "epoch: 1, batch: 500 // loss: 0.065\n", "epoch: 1, batch: 600 // loss: 0.067\n", "epoch: 1, batch: 700 // loss: 0.071\n", "epoch: 1, batch: 800 // loss: 0.074\n", "epoch: 1, batch: 900 // loss: 0.080\n", "epoch: 1, batch: 1000 // loss: 0.065\n", "epoch: 1, batch: 1100 // loss: 0.071\n", "epoch: 1, batch: 1200 // loss: 0.074\n", "epoch: 1, batch: 1300 // loss: 0.075\n", "epoch: 1, batch: 1400 // loss: 0.069\n", "epoch: 1, batch: 1500 // loss: 0.074\n", "epoch: 1, batch: 1600 // loss: 0.076\n", "epoch: 1, batch: 1700 // loss: 0.071\n", "epoch: 1, batch: 1800 // loss: 0.076\n", "epoch: 1, batch: 1900 // loss: 0.072\n", "epoch: 1, batch: 2000 // loss: 0.069\n", "epoch: 1, batch: 2100 // loss: 0.076\n", "epoch: 1, batch: 2200 // loss: 0.079\n", "epoch: 1, batch: 2300 // loss: 0.074\n", "epoch: 1, batch: 2400 // loss: 0.068\n", "epoch: 1, batch: 2500 // loss: 0.065\n", "epoch: 1, batch: 2600 // loss: 0.071\n", "epoch: 1, batch: 2700 // loss: 0.065\n", "epoch: 1, batch: 2800 // loss: 0.075\n", "epoch: 1, batch: 2900 // loss: 0.063\n", "epoch: 1, batch: 3000 // loss: 0.065\n", "epoch: 1, batch: 3100 // loss: 0.068\n", "epoch: 1, batch: 3200 // loss: 0.065\n", "epoch: 1, batch: 3300 // loss: 0.063\n", "epoch: 1, batch: 3400 // loss: 0.062\n", "epoch: 1, batch: 3500 // loss: 0.060\n", "epoch: 1, batch: 3600 // loss: 0.069\n", "epoch: 1, batch: 3700 // loss: 0.072\n", "\n", "epoch: 2, batch: 0 // loss: 0.078\n", "epoch: 2, batch: 100 // loss: 0.069\n", "epoch: 2, batch: 200 // loss: 0.071\n", "epoch: 2, batch: 300 // loss: 0.071\n", "epoch: 2, batch: 400 // loss: 0.070\n", "epoch: 2, batch: 500 // loss: 0.060\n", "epoch: 2, batch: 600 // loss: 0.062\n", "epoch: 2, batch: 700 // loss: 0.065\n", "epoch: 2, batch: 800 // loss: 0.067\n", "epoch: 2, batch: 900 // loss: 0.073\n", "epoch: 2, batch: 1000 // loss: 0.061\n", "epoch: 2, batch: 1100 // loss: 0.065\n", "epoch: 2, batch: 1200 // loss: 0.068\n", "epoch: 2, batch: 1300 // loss: 0.068\n", "epoch: 2, batch: 1400 // loss: 0.063\n", "epoch: 2, batch: 1500 // loss: 0.069\n", "epoch: 2, batch: 1600 // loss: 0.070\n", "epoch: 2, batch: 1700 // loss: 0.064\n", "epoch: 2, batch: 1800 // loss: 0.071\n", "epoch: 2, batch: 1900 // loss: 0.065\n", "epoch: 2, batch: 2000 // loss: 0.064\n", "epoch: 2, batch: 2100 // loss: 0.069\n", "epoch: 2, batch: 2200 // loss: 0.072\n", "epoch: 2, batch: 2300 // loss: 0.068\n", "epoch: 2, batch: 2400 // loss: 0.061\n", "epoch: 2, batch: 2500 // loss: 0.059\n", "epoch: 2, batch: 2600 // loss: 0.065\n", "epoch: 2, batch: 2700 // loss: 0.059\n", "epoch: 2, batch: 2800 // loss: 0.067\n", "epoch: 2, batch: 2900 // loss: 0.057\n", "epoch: 2, batch: 3000 // loss: 0.060\n", "epoch: 2, batch: 3100 // loss: 0.061\n", "epoch: 2, batch: 3200 // loss: 0.057\n", "epoch: 2, batch: 3300 // loss: 0.056\n", "epoch: 2, batch: 3400 // loss: 0.056\n", "epoch: 2, batch: 3500 // loss: 0.053\n", "epoch: 2, batch: 3600 // loss: 0.061\n", "epoch: 2, batch: 3700 // loss: 0.064\n", "\n", "epoch: 3, batch: 0 // loss: 0.070\n", "epoch: 3, batch: 100 // loss: 0.062\n", "epoch: 3, batch: 200 // loss: 0.064\n", "epoch: 3, batch: 300 // loss: 0.064\n", "epoch: 3, batch: 400 // loss: 0.062\n", "epoch: 3, batch: 500 // loss: 0.054\n", "epoch: 3, batch: 600 // loss: 0.055\n", "epoch: 3, batch: 700 // loss: 0.059\n", "epoch: 3, batch: 800 // loss: 0.059\n", "epoch: 3, batch: 900 // loss: 0.065\n", "epoch: 3, batch: 1000 // loss: 0.056\n", "epoch: 3, batch: 1100 // loss: 0.058\n", "epoch: 3, batch: 1200 // loss: 0.060\n", "epoch: 3, batch: 1300 // loss: 0.061\n", "epoch: 3, batch: 1400 // loss: 0.057\n", "epoch: 3, batch: 1500 // loss: 0.062\n", "epoch: 3, batch: 1600 // loss: 0.064\n", "epoch: 3, batch: 1700 // loss: 0.058\n", "epoch: 3, batch: 1800 // loss: 0.065\n", "epoch: 3, batch: 1900 // loss: 0.058\n", "epoch: 3, batch: 2000 // loss: 0.058\n", "epoch: 3, batch: 2100 // loss: 0.060\n", "epoch: 3, batch: 2200 // loss: 0.065\n", "epoch: 3, batch: 2300 // loss: 0.061\n", "epoch: 3, batch: 2400 // loss: 0.054\n", "epoch: 3, batch: 2500 // loss: 0.053\n", "epoch: 3, batch: 2600 // loss: 0.058\n", "epoch: 3, batch: 2700 // loss: 0.054\n", "epoch: 3, batch: 2800 // loss: 0.059\n", "epoch: 3, batch: 2900 // loss: 0.051\n", "epoch: 3, batch: 3000 // loss: 0.055\n", "epoch: 3, batch: 3100 // loss: 0.054\n", "epoch: 3, batch: 3200 // loss: 0.050\n", "epoch: 3, batch: 3300 // loss: 0.049\n", "epoch: 3, batch: 3400 // loss: 0.051\n", "epoch: 3, batch: 3500 // loss: 0.047\n", "epoch: 3, batch: 3600 // loss: 0.055\n", "epoch: 3, batch: 3700 // loss: 0.056\n", "\n", "epoch: 4, batch: 0 // loss: 0.064\n", "epoch: 4, batch: 100 // loss: 0.056\n", "epoch: 4, batch: 200 // loss: 0.057\n", "epoch: 4, batch: 300 // loss: 0.058\n", "epoch: 4, batch: 400 // loss: 0.056\n", "epoch: 4, batch: 500 // loss: 0.048\n", "epoch: 4, batch: 600 // loss: 0.050\n", "epoch: 4, batch: 700 // loss: 0.054\n", "epoch: 4, batch: 800 // loss: 0.052\n", "epoch: 4, batch: 900 // loss: 0.059\n", "epoch: 4, batch: 1000 // loss: 0.052\n", "epoch: 4, batch: 1100 // loss: 0.052\n", "epoch: 4, batch: 1200 // loss: 0.054\n", "epoch: 4, batch: 1300 // loss: 0.055\n", "epoch: 4, batch: 1400 // loss: 0.052\n", "epoch: 4, batch: 1500 // loss: 0.057\n", "epoch: 4, batch: 1600 // loss: 0.060\n", "epoch: 4, batch: 1700 // loss: 0.053\n", "epoch: 4, batch: 1800 // loss: 0.060\n", "epoch: 4, batch: 1900 // loss: 0.053\n", "epoch: 4, batch: 2000 // loss: 0.053\n", "epoch: 4, batch: 2100 // loss: 0.054\n", "epoch: 4, batch: 2200 // loss: 0.060\n", "epoch: 4, batch: 2300 // loss: 0.056\n", "epoch: 4, batch: 2400 // loss: 0.048\n", "epoch: 4, batch: 2500 // loss: 0.048\n", "epoch: 4, batch: 2600 // loss: 0.053\n", "epoch: 4, batch: 2700 // loss: 0.050\n", "epoch: 4, batch: 2800 // loss: 0.053\n", "epoch: 4, batch: 2900 // loss: 0.047\n", "epoch: 4, batch: 3000 // loss: 0.051\n", "epoch: 4, batch: 3100 // loss: 0.050\n", "epoch: 4, batch: 3200 // loss: 0.045\n", "epoch: 4, batch: 3300 // loss: 0.045\n", "epoch: 4, batch: 3400 // loss: 0.048\n", "epoch: 4, batch: 3500 // loss: 0.042\n", "epoch: 4, batch: 3600 // loss: 0.050\n", "epoch: 4, batch: 3700 // loss: 0.051\n", "\n", "epoch: 5, batch: 0 // loss: 0.059\n", "epoch: 5, batch: 100 // loss: 0.052\n", "epoch: 5, batch: 200 // loss: 0.052\n", "epoch: 5, batch: 300 // loss: 0.054\n", "epoch: 5, batch: 400 // loss: 0.052\n", "epoch: 5, batch: 500 // loss: 0.045\n", "epoch: 5, batch: 600 // loss: 0.046\n", "epoch: 5, batch: 700 // loss: 0.050\n", "epoch: 5, batch: 800 // loss: 0.048\n", "epoch: 5, batch: 900 // loss: 0.055\n", "epoch: 5, batch: 1000 // loss: 0.049\n", "epoch: 5, batch: 1100 // loss: 0.049\n", "epoch: 5, batch: 1200 // loss: 0.050\n", "epoch: 5, batch: 1300 // loss: 0.051\n", "epoch: 5, batch: 1400 // loss: 0.048\n", "epoch: 5, batch: 1500 // loss: 0.054\n", "epoch: 5, batch: 1600 // loss: 0.056\n", "epoch: 5, batch: 1700 // loss: 0.050\n", "epoch: 5, batch: 1800 // loss: 0.057\n", "epoch: 5, batch: 1900 // loss: 0.050\n", "epoch: 5, batch: 2000 // loss: 0.050\n", "epoch: 5, batch: 2100 // loss: 0.051\n", "epoch: 5, batch: 2200 // loss: 0.056\n", "epoch: 5, batch: 2300 // loss: 0.053\n", "epoch: 5, batch: 2400 // loss: 0.045\n", "epoch: 5, batch: 2500 // loss: 0.045\n", "epoch: 5, batch: 2600 // loss: 0.050\n", "epoch: 5, batch: 2700 // loss: 0.047\n", "epoch: 5, batch: 2800 // loss: 0.050\n", "epoch: 5, batch: 2900 // loss: 0.044\n", "epoch: 5, batch: 3000 // loss: 0.049\n", "epoch: 5, batch: 3100 // loss: 0.047\n", "epoch: 5, batch: 3200 // loss: 0.042\n", "epoch: 5, batch: 3300 // loss: 0.042\n", "epoch: 5, batch: 3400 // loss: 0.045\n", "epoch: 5, batch: 3500 // loss: 0.039\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 5, batch: 3600 // loss: 0.047\n", "epoch: 5, batch: 3700 // loss: 0.048\n", "\n", "epoch: 6, batch: 0 // loss: 0.056\n", "epoch: 6, batch: 100 // loss: 0.049\n", "epoch: 6, batch: 200 // loss: 0.049\n", "epoch: 6, batch: 300 // loss: 0.052\n", "epoch: 6, batch: 400 // loss: 0.049\n", "epoch: 6, batch: 500 // loss: 0.043\n", "epoch: 6, batch: 600 // loss: 0.044\n", "epoch: 6, batch: 700 // loss: 0.048\n", "epoch: 6, batch: 800 // loss: 0.045\n", "epoch: 6, batch: 900 // loss: 0.052\n", "epoch: 6, batch: 1000 // loss: 0.047\n", "epoch: 6, batch: 1100 // loss: 0.046\n", "epoch: 6, batch: 1200 // loss: 0.048\n", "epoch: 6, batch: 1300 // loss: 0.048\n", "epoch: 6, batch: 1400 // loss: 0.046\n", "epoch: 6, batch: 1500 // loss: 0.052\n", "epoch: 6, batch: 1600 // loss: 0.054\n", "epoch: 6, batch: 1700 // loss: 0.048\n", "epoch: 6, batch: 1800 // loss: 0.055\n", "epoch: 6, batch: 1900 // loss: 0.047\n", "epoch: 6, batch: 2000 // loss: 0.048\n", "epoch: 6, batch: 2100 // loss: 0.049\n", "epoch: 6, batch: 2200 // loss: 0.053\n", "epoch: 6, batch: 2300 // loss: 0.051\n", "epoch: 6, batch: 2400 // loss: 0.043\n", "epoch: 6, batch: 2500 // loss: 0.043\n", "epoch: 6, batch: 2600 // loss: 0.048\n", "epoch: 6, batch: 2700 // loss: 0.046\n", "epoch: 6, batch: 2800 // loss: 0.048\n", "epoch: 6, batch: 2900 // loss: 0.043\n", "epoch: 6, batch: 3000 // loss: 0.047\n", "epoch: 6, batch: 3100 // loss: 0.045\n", "epoch: 6, batch: 3200 // loss: 0.040\n", "epoch: 6, batch: 3300 // loss: 0.040\n", "epoch: 6, batch: 3400 // loss: 0.044\n", "epoch: 6, batch: 3500 // loss: 0.037\n", "epoch: 6, batch: 3600 // loss: 0.045\n", "epoch: 6, batch: 3700 // loss: 0.045\n", "\n", "epoch: 7, batch: 0 // loss: 0.054\n", "epoch: 7, batch: 100 // loss: 0.047\n", "epoch: 7, batch: 200 // loss: 0.046\n", "epoch: 7, batch: 300 // loss: 0.050\n", "epoch: 7, batch: 400 // loss: 0.047\n", "epoch: 7, batch: 500 // loss: 0.041\n", "epoch: 7, batch: 600 // loss: 0.042\n", "epoch: 7, batch: 700 // loss: 0.046\n", "epoch: 7, batch: 800 // loss: 0.043\n", "epoch: 7, batch: 900 // loss: 0.050\n", "epoch: 7, batch: 1000 // loss: 0.046\n", "epoch: 7, batch: 1100 // loss: 0.044\n", "epoch: 7, batch: 1200 // loss: 0.046\n", "epoch: 7, batch: 1300 // loss: 0.046\n", "epoch: 7, batch: 1400 // loss: 0.044\n", "epoch: 7, batch: 1500 // loss: 0.050\n", "epoch: 7, batch: 1600 // loss: 0.052\n", "epoch: 7, batch: 1700 // loss: 0.046\n", "epoch: 7, batch: 1800 // loss: 0.053\n", "epoch: 7, batch: 1900 // loss: 0.046\n", "epoch: 7, batch: 2000 // loss: 0.046\n", "epoch: 7, batch: 2100 // loss: 0.047\n", "epoch: 7, batch: 2200 // loss: 0.051\n", "epoch: 7, batch: 2300 // loss: 0.049\n", "epoch: 7, batch: 2400 // loss: 0.042\n", "epoch: 7, batch: 2500 // loss: 0.042\n", "epoch: 7, batch: 2600 // loss: 0.046\n", "epoch: 7, batch: 2700 // loss: 0.044\n", "epoch: 7, batch: 2800 // loss: 0.046\n", "epoch: 7, batch: 2900 // loss: 0.041\n", "epoch: 7, batch: 3000 // loss: 0.046\n", "epoch: 7, batch: 3100 // loss: 0.044\n", "epoch: 7, batch: 3200 // loss: 0.039\n", "epoch: 7, batch: 3300 // loss: 0.038\n", "epoch: 7, batch: 3400 // loss: 0.042\n", "epoch: 7, batch: 3500 // loss: 0.035\n", "epoch: 7, batch: 3600 // loss: 0.044\n", "epoch: 7, batch: 3700 // loss: 0.044\n", "\n", "epoch: 8, batch: 0 // loss: 0.052\n", "epoch: 8, batch: 100 // loss: 0.046\n", "epoch: 8, batch: 200 // loss: 0.045\n", "epoch: 8, batch: 300 // loss: 0.048\n", "epoch: 8, batch: 400 // loss: 0.045\n", "epoch: 8, batch: 500 // loss: 0.040\n", "epoch: 8, batch: 600 // loss: 0.041\n", "epoch: 8, batch: 700 // loss: 0.045\n", "epoch: 8, batch: 800 // loss: 0.041\n", "epoch: 8, batch: 900 // loss: 0.049\n", "epoch: 8, batch: 1000 // loss: 0.044\n", "epoch: 8, batch: 1100 // loss: 0.043\n", "epoch: 8, batch: 1200 // loss: 0.045\n", "epoch: 8, batch: 1300 // loss: 0.044\n", "epoch: 8, batch: 1400 // loss: 0.042\n", "epoch: 8, batch: 1500 // loss: 0.048\n", "epoch: 8, batch: 1600 // loss: 0.051\n", "epoch: 8, batch: 1700 // loss: 0.045\n", "epoch: 8, batch: 1800 // loss: 0.052\n", "epoch: 8, batch: 1900 // loss: 0.044\n", "epoch: 8, batch: 2000 // loss: 0.045\n", "epoch: 8, batch: 2100 // loss: 0.046\n", "epoch: 8, batch: 2200 // loss: 0.050\n", "epoch: 8, batch: 2300 // loss: 0.048\n", "epoch: 8, batch: 2400 // loss: 0.041\n", "epoch: 8, batch: 2500 // loss: 0.041\n", "epoch: 8, batch: 2600 // loss: 0.045\n", "epoch: 8, batch: 2700 // loss: 0.043\n", "epoch: 8, batch: 2800 // loss: 0.044\n", "epoch: 8, batch: 2900 // loss: 0.040\n", "epoch: 8, batch: 3000 // loss: 0.044\n", "epoch: 8, batch: 3100 // loss: 0.042\n", "epoch: 8, batch: 3200 // loss: 0.037\n", "epoch: 8, batch: 3300 // loss: 0.037\n", "epoch: 8, batch: 3400 // loss: 0.041\n", "epoch: 8, batch: 3500 // loss: 0.034\n", "epoch: 8, batch: 3600 // loss: 0.043\n", "epoch: 8, batch: 3700 // loss: 0.042\n", "\n", "epoch: 9, batch: 0 // loss: 0.051\n", "epoch: 9, batch: 100 // loss: 0.045\n", "epoch: 9, batch: 200 // loss: 0.043\n", "epoch: 9, batch: 300 // loss: 0.047\n", "epoch: 9, batch: 400 // loss: 0.044\n", "epoch: 9, batch: 500 // loss: 0.039\n", "epoch: 9, batch: 600 // loss: 0.039\n", "epoch: 9, batch: 700 // loss: 0.044\n", "epoch: 9, batch: 800 // loss: 0.040\n", "epoch: 9, batch: 900 // loss: 0.048\n", "epoch: 9, batch: 1000 // loss: 0.043\n", "epoch: 9, batch: 1100 // loss: 0.042\n", "epoch: 9, batch: 1200 // loss: 0.043\n", "epoch: 9, batch: 1300 // loss: 0.043\n", "epoch: 9, batch: 1400 // loss: 0.041\n", "epoch: 9, batch: 1500 // loss: 0.047\n", "epoch: 9, batch: 1600 // loss: 0.049\n", "epoch: 9, batch: 1700 // loss: 0.044\n", "epoch: 9, batch: 1800 // loss: 0.051\n", "epoch: 9, batch: 1900 // loss: 0.043\n", "epoch: 9, batch: 2000 // loss: 0.043\n", "epoch: 9, batch: 2100 // loss: 0.045\n", "epoch: 9, batch: 2200 // loss: 0.048\n", "epoch: 9, batch: 2300 // loss: 0.047\n", "epoch: 9, batch: 2400 // loss: 0.040\n", "epoch: 9, batch: 2500 // loss: 0.040\n", "epoch: 9, batch: 2600 // loss: 0.044\n", "epoch: 9, batch: 2700 // loss: 0.042\n", "epoch: 9, batch: 2800 // loss: 0.043\n", "epoch: 9, batch: 2900 // loss: 0.039\n", "epoch: 9, batch: 3000 // loss: 0.043\n", "epoch: 9, batch: 3100 // loss: 0.042\n", "epoch: 9, batch: 3200 // loss: 0.036\n", "epoch: 9, batch: 3300 // loss: 0.036\n", "epoch: 9, batch: 3400 // loss: 0.040\n", "epoch: 9, batch: 3500 // loss: 0.033\n", "epoch: 9, batch: 3600 // loss: 0.041\n", "epoch: 9, batch: 3700 // loss: 0.041\n" ] } ], "source": [ "auto3 = AE2(hidden_size=16)\n", "optimizer = optim.SGD(auto3.parameters(), lr=0.01, momentum=0.9)\n", "train_AE(X_corrupt, X, auto3, optimizer, loss_function)" ] }, { "cell_type": "code", "execution_count": 215, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 215, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "Zs = auto3(X[:5000].float(), return_z=True).detach().numpy()\n", "plt.scatter(Zs[:,0], Zs[:,1], c=c)" ] }, { "cell_type": "code", "execution_count": 216, "metadata": {}, "outputs": [], "source": [ "X_tilde = auto3(X[:5000].float()).detach().numpy()" ] }, { "cell_type": "code", "execution_count": 222, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 222, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAPsAAAD4CAYAAAAq5pAIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAAVYklEQVR4nO3dXWzc5ZUG8OfYhHwnxEmcTyshiaWQLNoQWdFKLAuralvKDfSiq3JRsRLa9KJIrdSLRexFuUSrbaterCqlC2q66lJVahFcoN0iVAn1psKgAMk6cT5NnDh2MPmEfDpnLzxILvj/PGbGnhn1fX5SZMcn78zr/8zJjH3e97yRmTCzv3wdrZ6AmTWHk92sEE52s0I42c0K4WQ3K8Rdzbyzjo6O7OzsrIzPnz+/7tu+ffs2jbP7BYCODv7/Hrt9NVZVPO6++24aX7x4MY2z+79z5w4dq66Lmnsj1Rx13W7evEnj165dq3u8+r4jgsbVdVXj2XVr5DG7ceMGbt26Ne2dN5TsEfEogJ8C6ATwn5n5gprkypUrK+ObN29W91cZ++ijj+jYe+65h8YXLFhA4xcvXqyMLVq0iI5VT9pNmzbR+J49e2ic/Sf5ySef0LHLly+ncfWfqIqzx0xdt6GhIRo/dOgQjZ8+fboytmTJEjpWPR+uXLlC4+qFiz0nrl+/Tseyx+zAgQOVsbrfxkdEJ4D/APB1ADsAPBkRO+q9PTObW438zL4HwLHMPJGZNwH8GsDjszMtM5ttjST7BgBT3ycN1772ZyJib0T0R0S/+lnEzOZOI8k+3Q9jX/itQ2buy8y+zOxTv5Axs7nTSPYNA+iZ8veNAM42Nh0zmyuNJPvbAHoj4t6IuBvAtwC8NjvTMrPZVnfpLTNvR8QzAP4Xk6W3lzKT1kLmzZuHNWvWVMZV7ZOVM+6991469uOPP6ZxZdWqVZUxVWtevXo1je/evZvGv/a1r9E4m5u6pmvXrqXxsbExGlc/mrE4K40BwM6dO2lclVvZ+gVVDh0fH6dxdV3V7bPnslp3weY2MTFRGWuozp6ZrwN4vZHbMLPm8G/MzArhZDcrhJPdrBBOdrNCONnNCuFkNytEU/ez33XXXXSLayO18DNnztC42tI4b968uu+bbX8FgPXr19N4T08Pjau5sZru0qVL6x4LAF1dXTSurvutW7cqYzdu3KBjVZyt2QB4zfno0aN0rPq+VS18eHiYxtnWXzZvgPc3YOsa/MpuVggnu1khnOxmhXCymxXCyW5WCCe7WSGaWnqbmJig3U5VmYh1MlWdaVWJSW3VZKWWbdu20bGNtnO+fPly3bd/6dIlOlZ13VWdTlVJs5GWySquWkmz712NVd1h1fZa1bWXfW+sXAlMlrCrsJKeX9nNCuFkNyuEk92sEE52s0I42c0K4WQ3K4ST3awQTa2zA7y+qLZystbDanvsihUraLyRI53PnTtHx6otrI2sLwD4VlDWZhrQ9Wb1mKjTTNnjrWr8Fy5coPEdO/g5oqOjo5UxdV3U+gRFjWf1cPVcHRwcrIyxGr1f2c0K4WQ3K4ST3awQTnazQjjZzQrhZDcrhJPdrBBNrbN3dHRgwYIFlXFVs92yZUtlTB2xy+qaAPDpp5/SOKsXq+OiVR1d1emXLVtG42yNgGpzreroau6qlTS77mpthNpTzuro6vbVc01932rPuepBwPo6sBjA1yecP3++MtZQskfEKQBXAEwAuJ2ZfY3cnpnNndl4Zf/7zORtO8ys5fwzu1khGk32BPD7iHgnIvZO9w8iYm9E9EdEv/o5x8zmTqNv4x/MzLMR0Q3gjYg4nJlvTf0HmbkPwD4AWLp0aXX3QTObUw29smfm2drHMQCvANgzG5Mys9lXd7JHxOKIWPrZ5wC+CuDgbE3MzGZXI2/j1wB4pVZHvQvAf2fm/7ABt2/fpnuU2VG0AN/PvnXrVjp2ZGSExtlR0gCvyzbaF56tPQB0z3u2313V6FX/c/W9qTo922uvxqq99gsXLqRxdl3Vugr1mLF6NqCPk2b9EdTc2HVj6xrqTvbMPAHgr+sdb2bN5dKbWSGc7GaFcLKbFcLJblYIJ7tZIZreSpod4Xv16lU6lh2bPDQ0RMf29vbSuDqamJWBJiYm6NhGlwl3d3fTOJubKp2pNtdqi6zaOszKRGNjYw3dtmqxzUq5qk318PAwjatSrbpu9R67DPCtvz6y2cyc7GalcLKbFcLJblYIJ7tZIZzsZoVwspsVoql19nnz5mHdunWV8ePHj9Px6phdhm2PBXjdE+A1W7ZdEdBbOVVLZbX+gNVW1X2rerOqZbO1DwBfg7B69Wo69vDhwzSuWi6z+1bXVB0nrWrhKs6ox4xtgWXrKvzKblYIJ7tZIZzsZoVwspsVwsluVggnu1khnOxmhWhqnf3OnTu0NrpkyRI6nh1tvHbtWjpWtedV9WTWElkd76vaCquarNobvXz58rpvWx1d/OGHH9L4Qw89ROPs2qi1D6qGr+Ls+aTGqjo868sAABs3bqRxdtS1ah3OWmR7P7uZOdnNSuFkNyuEk92sEE52s0I42c0K4WQ3K0RT6+wdHR10X7iqfbJ94+roYVXrPnHiRN3j1b5qVqMHdI1/w4YNNK5q5Yzai6/6oy9atIjG2WOqjlxW6xfU3FktXN23ei6qswDU2gjW63/Hjh10LFufwL5n+coeES9FxFhEHJzyta6IeCMijtY+rlC3Y2atNZO38b8A8OjnvvYsgDczsxfAm7W/m1kbk8memW8B+HzfpMcB7K99vh/AE7M8LzObZfX+gm5NZo4AQO1j5WFkEbE3Ivojor/RM8/MrH5z/tv4zNyXmX2Z2aca6ZnZ3Kk32UcjYh0A1D7y4zjNrOXqTfbXADxV+/wpAK/OznTMbK7IOntEvAzgEQCrImIYwA8BvADgNxHxNIAPAXxzJnem9rOrejH7mV/VRdXe6a6uLhpne6PVXnlVL1Z7zlVf+fXr11fGVP9zdc3V96bWELDrtmIFr9iqGj/rCw/w66rWNoyPj9O4uq7qHAK2dkKNZWsb2NoDmeyZ+WRF6CtqrJm1Dy+XNSuEk92sEE52s0I42c0K4WQ3K0RTt7hOTEzg8uXLlfHz58/T8fPnz6+MqVbSqpQyNsbXBbGjplVpTZXOtm/fTuNqe+7mzZsrY9evX6djVZlHleZ6enpo/NKlS5UxVf5S140dTwzwFtuqbKdKa6okuWzZMhpn7aDV9ljWarqhLa5m9pfByW5WCCe7WSGc7GaFcLKbFcLJblYIJ7tZIZpaZwf4FjzVyYZtQ1V1T1bXBHQtm9V01fG8Ks7aCgO6Ds/WCKijhVUbbFVnV+sTWL1a1dnVY6bi7DmhjgdX6xPU9lv1mLIt2eoxYe3YWX75ld2sEE52s0I42c0K4WQ3K4ST3awQTnazQjjZzQrR1Dp7ZtL65ZYtW+h4VrtUe5tVXVRh+5/ZPntAt1tWbbAvXLhA46xmrGq26qhrtfZBHdms5s6o9t5qLz773tVxz+r5NDQ0ROOqjn/u3LnKGKujA3ovfhW/spsVwsluVggnu1khnOxmhXCymxXCyW5WCCe7WSGaWmfv7Oyk+5tV7ZPVF1VddHR0lMbZEboA7w2/cOFCOpYdNQ0AW7dupXE1d9YfncUAoLu7m8ZVTVf1OGfrG06dOkXHqjq6mltnZ2fdY9VzUfWVX7VqFY2z56s6wpv1KGBj5St7RLwUEWMRcXDK156PiDMRcaD25zF1O2bWWjN5G/8LAI9O8/WfZOau2p/XZ3daZjbbZLJn5lsA+Dk8Ztb2GvkF3TMR8X7tbf6Kqn8UEXsjoj8i+lXPMTObO/Um+88AbAWwC8AIgB9V/cPM3JeZfZnZp37hYmZzp65kz8zRzJzIzDsAfg5gz+xOy8xmW13JHhFTzy/+BoCDVf/WzNqDfF8dES8DeATAqogYBvBDAI9ExC4ACeAUgO/M5M4yk54trfYAs3q1qk2qvfLsHHEAWLGi8tcSsre6Or99cHCQxu+//34aZ+eYqx+dVH9ztd9d7Vdn+93V2oaBgQEaV/u+WZ290eui1j6w5wsArF69ujKm+iMcPny4Msbq9zLZM/PJab78ohpnZu3Fy2XNCuFkNyuEk92sEE52s0I42c0K0VZbXFUJi5Vq1BbX06dP0zgrXwHApk2bKmOqZKjKNLt376ZxVd5i7Z7VscbquqmtnqpNNmsdfvXqVTpWtcFWba6Hh4crY6oV9OXLl2lctf9W14WVz9T2WJZDrNzoV3azQjjZzQrhZDcrhJPdrBBOdrNCONnNCuFkNytE01vHsLqu2hbIjrk9efIkHdvb20vjqqbL4qqt8MaNG2lc1eFZjR8Ali1bVhlj1wzQW4PZlmSA13UB/nirNmVqC+uRI0doXM2NUesLVPzs2bM0zrZcq7URrAU3e7z8ym5WCCe7WSGc7GaFcLKbFcLJblYIJ7tZIZzsZoVoap19YmKC7llXbYtZ+1/VKvrEiRM0rtr3sr3RrF0yAJw5c4bGWVthQNd02b5w1TJZ7btWLZXZdQGA++67rzKmjntWc1P7/FmtW9Xw2bHIgP6+t2/fTuPHjh2rjLF1E4Ben1DFr+xmhXCymxXCyW5WCCe7WSGc7GaFcLKbFcLJblaIptbZI4LWfbu6uuj48fHxypiq2ao6uupBPjExURlTe+HZvAFdp1c1YdbjXI1VaxtUf/Tu7m4aZ/Vo1Tf+vffeo3H1mLG4+r5VHwC1BkD1KGB50EhPerY+QL6yR0RPRPwhIgYi4lBEfK/29a6IeCMijtY+8s4TZtZSM3kbfxvADzLzPgB/A+C7EbEDwLMA3szMXgBv1v5uZm1KJntmjmTmu7XPrwAYALABwOMA9tf+2X4AT8zVJM2scV/qF3QRsRnAAwD+BGBNZo4Ak/8hAJj2h7eI2BsR/RHRX++aXjNr3IyTPSKWAPgtgO9nJj/1borM3JeZfZnZpzZlmNncmVGyR8Q8TCb6rzLzd7Uvj0bEulp8HYCxuZmimc0G+VIbk72GXwQwkJk/nhJ6DcBTAF6ofXxV3VZnZyfdvjcyMkLHsx8D1JHLS5cupXF1XPS6desqY6qV9MKFC2l8YGCAxlUbbEaVt9Tc1GMyODhI4w888EBlTB113dPTQ+PqutHji8W2YdWGWrV7ZkdVA8CaNWsqY2rrbr1m8r76QQDfBvBBRByofe05TCb5byLiaQAfAvjmnMzQzGaFTPbM/COAqpMEvjK70zGzueLlsmaFcLKbFcLJblYIJ7tZIZzsZoVoeitpth2TxQC+ZXHlypV0rNqSqLZLsnp1o8uAVSvpS5cu0TirR6vv+9NPP6VxVY9W2zEb2Rqs2jmr+2a1cnXfat2GWlvRyJbpVatW0bFqO3cVv7KbFcLJblYIJ7tZIZzsZoVwspsVwsluVggnu1kh2qp1jKpdsj3pR44caei+1f5l1mVHtSVme5cBvedcXRfWI4DVcwG+Tx/Qx02rmjBbg6COJlb3rWrZbI2AquFv27aNxtVjrlp4s/3uN2/epGNZ6/HJ9hPT8yu7WSGc7GaFcLKbFcLJblYIJ7tZIZzsZoVwspsVoql19sykdVfVi/vWrVuVMXUks6qjq+OiWS1c1cHVfS9fvpzGFdYHgF0zQPc3V3V4dfsrVlQf7qv6xh8/fpzG1fOFxdUx2Sp+4sQJGlf9FTZu3FgZa2QvPVsP4ld2s0I42c0K4WQ3K4ST3awQTnazQjjZzQrhZDcrxEzOZ+8B8EsAawHcAbAvM38aEc8D+GcA52v/9LnMfJ3dVkdHBz0PXNV8WY/zDRs20LHj4+N13zbA922reat926qHuTo7vru7uzKmequzsQAwNDRE43fu3KFx1hNf7eNnNXqA9zcAGttLf+DAARpX+9XV8+nUqVOVMbXmgz3f2OMxk0U1twH8IDPfjYilAN6JiDdqsZ9k5r/P4DbMrMVmcj77CICR2udXImIAAH8ZNbO286V+Zo+IzQAeAPCn2peeiYj3I+KliJj2PVdE7I2I/ojoV0srzWzuzDjZI2IJgN8C+H5mXgbwMwBbAezC5Cv/j6Ybl5n7MrMvM/tUzzAzmzszSvaImIfJRP9VZv4OADJzNDMnMvMOgJ8D2DN30zSzRslkj8l2lS8CGMjMH0/5+tTtUN8AcHD2p2dms2Umv41/EMC3AXwQEZ/VI54D8GRE7AKQAE4B+M5M7pBt91TbKU+ePFkZUy2T1RZYNZ619+3t7a17LKBLSI20klYloGvXrtH4zp07aVxt5WTbTNVx0mpuFy5coHG2jVSVS3fs2EHjqiSpnstse686opuVJFl+zeS38X8EMF0zalpTN7P24hV0ZoVwspsVwsluVggnu1khnOxmhXCymxWiqa2kJyYm6FZTVVdlWyJZC12AH98L6Pa9rA6vxl68eJHGVS387NmzNP7www9XxlSNf3BwkMZVLZxtIwWAsbGxytjw8DAde/jwYRofHR2l8XPnzlXGVC1b2bVrF42PjIzQOKvzs2OXAf6YsqOo/cpuVggnu1khnOxmhXCymxXCyW5WCCe7WSGc7GaFCFaXm/U7izgPYOpG4FUAPmraBL6cdp1bu84L8NzqNZtz25SZ0/bvbmqyf+HOI/ozs69lEyDadW7tOi/Ac6tXs+bmt/FmhXCymxWi1cm+r8X3z7Tr3Np1XoDnVq+mzK2lP7ObWfO0+pXdzJrEyW5WiJYke0Q8GhFHIuJYRDzbijlUiYhTEfFBRByIiP4Wz+WliBiLiINTvtYVEW9ExNHaR36ucXPn9nxEnKlduwMR8ViL5tYTEX+IiIGIOBQR36t9vaXXjsyrKdet6T+zR0QngEEA/wBgGMDbAJ7MzP9r6kQqRMQpAH2Z2fIFGBHxdwCuAvhlZv5V7Wv/BuDjzHyh9h/lisz8lzaZ2/MArrb6GO/aaUXrph4zDuAJAP+EFl47Mq9/RBOuWyte2fcAOJaZJzLzJoBfA3i8BfNoe5n5FoDPt8F5HMD+2uf7MflkabqKubWFzBzJzHdrn18B8Nkx4y29dmReTdGKZN8A4PSUvw+jvc57TwC/j4h3ImJvqyczjTWZOQJMPnkAdLd4Pp8nj/Fups8dM942166e488b1Ypkn67BVjvV/x7MzN0Avg7gu7W3qzYzMzrGu1mmOWa8LdR7/HmjWpHswwB6pvx9IwDeUbGJMvNs7eMYgFfQfkdRj352gm7tY3VHxyZrp2O8pztmHG1w7Vp5/Hkrkv1tAL0RcW9E3A3gWwBea8E8viAiFtd+cYKIWAzgq2i/o6hfA/BU7fOnALzawrn8mXY5xrvqmHG0+Nq1/PjzzGz6HwCPYfI38scB/Gsr5lAxry0A3qv9OdTquQF4GZNv625h8h3R0wBWAngTwNHax642mtt/AfgAwPuYTKx1LZrb32LyR8P3ARyo/Xms1deOzKsp183LZc0K4RV0ZoVwspsVwsluVggnu1khnOxmhXCymxXCyW5WiP8HWh8prI7TKYgAAAAASUVORK5CYII=\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "imshow(np.asarray(X_tilde[2]).reshape(28,28), cmap='gray')" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Finally, let's add a regularization penalty on the hidden layer" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "First, let's define the model appropriately. Consider: What do we need to change from above variants? Think about the training loop (below.)" ] }, { "cell_type": "code", "execution_count": 223, "metadata": {}, "outputs": [], "source": [ "class AE_regularized(nn.Module):\n", " \n", " def __init__(self, input_size=784, hidden_size=2):\n", " '''\n", " In the initializer we setup model parameters/layers.\n", " '''\n", " super(AE_regularized, self).__init__() \n", "\n", " self.input_size = input_size\n", " self.hidden_size = hidden_size\n", " \n", " # input layer; from x -> z\n", " self.i = nn.Linear(self.input_size, self.hidden_size)\n", " \n", " self.a = nn.Sigmoid()\n", " \n", " # output layer\n", " self.o = nn.Linear(self.hidden_size, self.input_size)\n", " \n", "\n", " def forward(self, X):\n", " z = self.a(self.i(X))\n", " # Now we always return z along with the output\n", " return self.o(z), z" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "Now update the training loop to incorporate regularization. This will take a parameter `lambda_` that encodes how much weight to put on the regularization penalty (vs typical/reconstruction loss).\n", "\n", "Two hints: \n", "\n", "(1) Consider that we want to incur a loss associated with our regularization (an l1 norm); where should we do that?\n", "\n", "(2) See `torch.norm` (https://pytorch.org/docs/stable/torch.html#torch.norm)." ] }, { "cell_type": "code", "execution_count": 228, "metadata": {}, "outputs": [], "source": [ "def train_regularized_AE(X_in, X_target, model, optimizer, loss_function, lambda_, EPOCHS=10):\n", " for epoch in range(EPOCHS): \n", " idx, batch_num = 0, 0\n", " batch_size = 16\n", "\n", " print(\"\")\n", " while idx < 60000:\n", " # zero the parameter gradients\n", " optimizer.zero_grad()\n", "\n", " X_batch = X_in[idx: idx + batch_size].float()\n", " X_target_batch = X_target[idx: idx + batch_size].float()\n", " idx += batch_size\n", "\n", " # now run our X's forward, get preds, incur\n", " # loss, backprop, and step the optimizer.\n", " X_tilde_batch, z = model(X_batch)\n", " output_loss = loss_function(X_tilde_batch, X_target_batch)\n", " \n", " # here is the regularization loss.\n", " reg_loss = torch.norm(z, 1)\n", " \n", " loss = output_loss + lambda_ * reg_loss\n", " loss.backward()\n", " optimizer.step()\n", "\n", " # print out loss\n", " if batch_num % 100 == 0:\n", " print(\"epoch: {}, batch: {} // loss: {:.3f} // reg. loss (* \\lambda): {:.3f}\".format(\n", " epoch, batch_num, output_loss.item(), lambda_ * reg_loss.item()))\n", "\n", " batch_num += 1" ] }, { "cell_type": "code", "execution_count": 229, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "epoch: 0, batch: 0 // loss: 0.311 // reg. loss (* \\lambda): 125.579\n", "epoch: 0, batch: 100 // loss: 0.239 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 200 // loss: 0.207 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 300 // loss: 0.192 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 400 // loss: 0.196 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 500 // loss: 0.191 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 600 // loss: 0.189 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 700 // loss: 0.195 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 800 // loss: 0.162 // reg. loss (* \\lambda): 0.005\n", "epoch: 0, batch: 900 // loss: 0.198 // reg. loss (* \\lambda): 0.184\n", "epoch: 0, batch: 1000 // loss: 0.173 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1100 // loss: 0.196 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1200 // loss: 0.149 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1300 // loss: 0.179 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1400 // loss: 0.140 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1500 // loss: 0.140 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1600 // loss: 0.160 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1700 // loss: 0.144 // reg. loss (* \\lambda): 0.006\n", "epoch: 0, batch: 1800 // loss: 0.170 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 1900 // loss: 0.144 // reg. loss (* \\lambda): 0.001\n", "epoch: 0, batch: 2000 // loss: 0.122 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2100 // loss: 0.125 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2200 // loss: 0.155 // reg. loss (* \\lambda): 0.001\n", "epoch: 0, batch: 2300 // loss: 0.132 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2400 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2500 // loss: 0.106 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2600 // loss: 0.140 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2700 // loss: 0.103 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2800 // loss: 0.139 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 2900 // loss: 0.094 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3000 // loss: 0.106 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3100 // loss: 0.127 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3200 // loss: 0.090 // reg. loss (* \\lambda): 0.002\n", "epoch: 0, batch: 3300 // loss: 0.103 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3400 // loss: 0.101 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3500 // loss: 0.108 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3600 // loss: 0.111 // reg. loss (* \\lambda): 0.000\n", "epoch: 0, batch: 3700 // loss: 0.122 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 1, batch: 0 // loss: 0.115 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 100 // loss: 0.110 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 200 // loss: 0.108 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 300 // loss: 0.097 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 400 // loss: 0.101 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 500 // loss: 0.095 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 600 // loss: 0.097 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 700 // loss: 0.102 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 800 // loss: 0.092 // reg. loss (* \\lambda): 0.004\n", "epoch: 1, batch: 900 // loss: 0.113 // reg. loss (* \\lambda): 0.161\n", "epoch: 1, batch: 1000 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1100 // loss: 0.110 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1200 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1300 // loss: 0.107 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1500 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1600 // loss: 0.101 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1700 // loss: 0.097 // reg. loss (* \\lambda): 0.005\n", "epoch: 1, batch: 1800 // loss: 0.107 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 1900 // loss: 0.095 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2100 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2200 // loss: 0.108 // reg. loss (* \\lambda): 0.001\n", "epoch: 1, batch: 2300 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2400 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2600 // loss: 0.102 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2700 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2800 // loss: 0.105 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 2900 // loss: 0.075 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3000 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3100 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3200 // loss: 0.077 // reg. loss (* \\lambda): 0.001\n", "epoch: 1, batch: 3300 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3400 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3500 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 1, batch: 3700 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 2, batch: 0 // loss: 0.100 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 300 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 400 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 500 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 600 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 700 // loss: 0.087 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 800 // loss: 0.085 // reg. loss (* \\lambda): 0.003\n", "epoch: 2, batch: 900 // loss: 0.099 // reg. loss (* \\lambda): 0.144\n", "epoch: 2, batch: 1000 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1100 // loss: 0.094 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1300 // loss: 0.095 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1600 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.004\n", "epoch: 2, batch: 1800 // loss: 0.095 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 1900 // loss: 0.087 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2200 // loss: 0.100 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2300 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2400 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2500 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2600 // loss: 0.095 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2800 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 2900 // loss: 0.075 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3000 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3100 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3200 // loss: 0.078 // reg. loss (* \\lambda): 0.001\n", "epoch: 2, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3500 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3600 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 2, batch: 3700 // loss: 0.094 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 3, batch: 0 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 100 // loss: 0.085 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 200 // loss: 0.095 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 300 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 400 // loss: 0.087 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 500 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 3, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 700 // loss: 0.085 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 800 // loss: 0.085 // reg. loss (* \\lambda): 0.003\n", "epoch: 3, batch: 900 // loss: 0.097 // reg. loss (* \\lambda): 0.130\n", "epoch: 3, batch: 1000 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1100 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1200 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1300 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.004\n", "epoch: 3, batch: 1800 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2400 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2500 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2800 // loss: 0.097 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3000 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3200 // loss: 0.079 // reg. loss (* \\lambda): 0.001\n", "epoch: 3, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3500 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 3, batch: 3700 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 4, batch: 0 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 100 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 300 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 700 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 800 // loss: 0.085 // reg. loss (* \\lambda): 0.002\n", "epoch: 4, batch: 900 // loss: 0.096 // reg. loss (* \\lambda): 0.119\n", "epoch: 4, batch: 1000 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1100 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1300 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.003\n", "epoch: 4, batch: 1800 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2400 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2500 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2800 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3200 // loss: 0.080 // reg. loss (* \\lambda): 0.001\n", "epoch: 4, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 4, batch: 3700 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 5, batch: 0 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 100 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 300 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 700 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 800 // loss: 0.086 // reg. loss (* \\lambda): 0.002\n", "epoch: 5, batch: 900 // loss: 0.096 // reg. loss (* \\lambda): 0.110\n", "epoch: 5, batch: 1000 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1300 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1400 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.003\n", "epoch: 5, batch: 1800 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2500 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2800 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3200 // loss: 0.080 // reg. loss (* \\lambda): 0.001\n", "epoch: 5, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 5, batch: 3700 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 6, batch: 0 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 100 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 300 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 700 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 800 // loss: 0.086 // reg. loss (* \\lambda): 0.002\n", "epoch: 6, batch: 900 // loss: 0.096 // reg. loss (* \\lambda): 0.102\n", "epoch: 6, batch: 1000 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 6, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1300 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1400 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.003\n", "epoch: 6, batch: 1800 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2500 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2800 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3200 // loss: 0.080 // reg. loss (* \\lambda): 0.001\n", "epoch: 6, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 6, batch: 3700 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 7, batch: 0 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 100 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 300 // loss: 0.087 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 700 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 800 // loss: 0.086 // reg. loss (* \\lambda): 0.001\n", "epoch: 7, batch: 900 // loss: 0.096 // reg. loss (* \\lambda): 0.096\n", "epoch: 7, batch: 1000 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1300 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1400 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.003\n", "epoch: 7, batch: 1800 // loss: 0.091 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2500 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2800 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3200 // loss: 0.080 // reg. loss (* \\lambda): 0.001\n", "epoch: 7, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 7, batch: 3700 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 8, batch: 0 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 100 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 300 // loss: 0.087 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 700 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 800 // loss: 0.086 // reg. loss (* \\lambda): 0.001\n", "epoch: 8, batch: 900 // loss: 0.096 // reg. loss (* \\lambda): 0.090\n", "epoch: 8, batch: 1000 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1300 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1400 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.002\n", "epoch: 8, batch: 1800 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2500 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2800 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3200 // loss: 0.080 // reg. loss (* \\lambda): 0.001\n", "epoch: 8, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 8, batch: 3700 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "\n", "epoch: 9, batch: 0 // loss: 0.099 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 100 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 200 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 300 // loss: 0.087 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 400 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 500 // loss: 0.078 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 600 // loss: 0.081 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 700 // loss: 0.084 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 800 // loss: 0.086 // reg. loss (* \\lambda): 0.001\n", "epoch: 9, batch: 900 // loss: 0.096 // reg. loss (* \\lambda): 0.085\n", "epoch: 9, batch: 1000 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1200 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1300 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1400 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1700 // loss: 0.092 // reg. loss (* \\lambda): 0.002\n", "epoch: 9, batch: 1800 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 1900 // loss: 0.086 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2000 // loss: 0.079 // reg. loss (* \\lambda): 0.000\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 9, batch: 2100 // loss: 0.089 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2200 // loss: 0.098 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2300 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2400 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2500 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2600 // loss: 0.093 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2700 // loss: 0.077 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2800 // loss: 0.096 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 2900 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3000 // loss: 0.083 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3100 // loss: 0.088 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3200 // loss: 0.080 // reg. loss (* \\lambda): 0.001\n", "epoch: 9, batch: 3300 // loss: 0.080 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3400 // loss: 0.076 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3500 // loss: 0.082 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3600 // loss: 0.090 // reg. loss (* \\lambda): 0.000\n", "epoch: 9, batch: 3700 // loss: 0.092 // reg. loss (* \\lambda): 0.000\n" ] } ], "source": [ "AER = AE_regularized(hidden_size=16)\n", "optimizer = optim.SGD(AER.parameters(), lr=0.01, momentum=0.9)\n", "train_regularized_AE(X_corrupt, X, AER, optimizer, loss_function, 1)" ] }, { "cell_type": "markdown", "metadata": {}, "source": [ "### Variational auto-encoders\n", "\n", "First, let's review on board..." ] }, { "cell_type": "code", "execution_count": 176, "metadata": {}, "outputs": [], "source": [ "from torch.nn import functional as F\n", "\n", "class VAE(nn.Module):\n", " \n", " def __init__(self, input_size=784, hidden_size1=32, hidden_size2=32):\n", " '''\n", " In the initializer we setup model parameters/layers.\n", " '''\n", " super(VAE, self).__init__() \n", " \n", " ### encoder layers\n", " self.fc_e = nn.Linear(784, hidden_size1)\n", " self.fc_mean = nn.Linear(hidden_size1, hidden_size2)\n", " self.fc_logvar = nn.Linear(hidden_size1, hidden_size2)\n", " \n", " ### decoder layers\n", " self.fc_d1 = nn.Linear(hidden_size2, hidden_size1)\n", " self.fc_d2 = nn.Linear(hidden_size1, 784)\n", " \n", " \n", " def encoder(self, x_in):\n", " x = self.fc_e(x_in)\n", " mean = self.fc_mean(x)\n", " logvar = self.fc_logvar(x)\n", " return mean, logvar\n", " \n", " def decoder(self, z):\n", " z = F.relu(self.fc_d1(z))\n", " x_out = F.sigmoid(self.fc_d2(z))\n", " #return x_out.view(-1,1,28,28)\n", " return x_out\n", " \n", " def sample_normal(self, mean, logvar):\n", " # Using torch.normal(means,sds) returns a stochastic tensor which we cannot backpropogate through.\n", " # Instead we utilize the 'reparameterization trick'.\n", " # http://stats.stackexchange.com/a/205336\n", " # http://dpkingma.com/wordpress/wp-content/uploads/2015/12/talk_nips_workshop_2015.pdf\n", " sd = torch.exp(logvar*0.5)\n", " e = torch.tensor((torch.randn(sd.size()))) # Sample from standard normal\n", " z = e.mul(sd).add_(mean)\n", " return z\n", " \n", " def forward(self, x_in):\n", " z_mean, z_logvar = self.encoder(x_in)\n", " z = self.sample_normal(z_mean, z_logvar)\n", " x_out = self.decoder(z)\n", " return x_out, z_mean, z_logvar\n" ] }, { "cell_type": "code", "execution_count": 177, "metadata": {}, "outputs": [], "source": [ "def train_VAE(X_in, X_target, model, optimizer, loss_function, EPOCHS=10):\n", " for epoch in range(EPOCHS): \n", " idx, batch_num = 0, 0\n", " batch_size = 16\n", "\n", " print(\"\")\n", " while idx < 60000:\n", " # zero the parameter gradients\n", " optimizer.zero_grad()\n", "\n", " X_batch = X_in[idx: idx + batch_size].float()\n", " X_target_batch = X_target[idx: idx + batch_size].float()\n", " idx += batch_size\n", "\n", " # now run our X's forward, get preds, incur\n", " # loss, backprop, and step the optimizer.\n", " X_tilde_batch, _, _ = model(X_batch)\n", " loss = loss_function(X_tilde_batch, X_target_batch)\n", " loss.backward()\n", " optimizer.step()\n", "\n", " # print out loss\n", " if batch_num % 100 == 0:\n", " print(\"epoch: {}, batch: {} // loss: {:.3f}\".format(epoch, batch_num, loss.item()))\n", "\n", " batch_num += 1" ] }, { "cell_type": "code", "execution_count": 178, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "\n", "epoch: 0, batch: 0 // loss: 0.186\n", "epoch: 0, batch: 100 // loss: 0.157\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:39: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 0, batch: 200 // loss: 0.187\n", "epoch: 0, batch: 300 // loss: 0.175\n", "epoch: 0, batch: 400 // loss: 0.172\n", "epoch: 0, batch: 500 // loss: 0.162\n", "epoch: 0, batch: 600 // loss: 0.167\n", "epoch: 0, batch: 700 // loss: 0.164\n", "epoch: 0, batch: 800 // loss: 0.173\n", "epoch: 0, batch: 900 // loss: 0.167\n", "epoch: 0, batch: 1000 // loss: 0.152\n", "epoch: 0, batch: 1100 // loss: 0.157\n", "epoch: 0, batch: 1200 // loss: 0.153\n", "epoch: 0, batch: 1300 // loss: 0.148\n", "epoch: 0, batch: 1400 // loss: 0.155\n", "epoch: 0, batch: 1500 // loss: 0.148\n", "epoch: 0, batch: 1600 // loss: 0.147\n", "epoch: 0, batch: 1700 // loss: 0.144\n", "epoch: 0, batch: 1800 // loss: 0.132\n", "epoch: 0, batch: 1900 // loss: 0.135\n", "epoch: 0, batch: 2000 // loss: 0.119\n", "epoch: 0, batch: 2100 // loss: 0.123\n", "epoch: 0, batch: 2200 // loss: 0.127\n", "epoch: 0, batch: 2300 // loss: 0.119\n", "epoch: 0, batch: 2400 // loss: 0.109\n", "epoch: 0, batch: 2500 // loss: 0.100\n", "epoch: 0, batch: 2600 // loss: 0.107\n", "epoch: 0, batch: 2700 // loss: 0.094\n", "epoch: 0, batch: 2800 // loss: 0.104\n", "epoch: 0, batch: 2900 // loss: 0.091\n", "epoch: 0, batch: 3000 // loss: 0.094\n", "epoch: 0, batch: 3100 // loss: 0.089\n", "epoch: 0, batch: 3200 // loss: 0.093\n", "epoch: 0, batch: 3300 // loss: 0.088\n", "epoch: 0, batch: 3400 // loss: 0.078\n", "epoch: 0, batch: 3500 // loss: 0.084\n", "epoch: 0, batch: 3600 // loss: 0.099\n", "epoch: 0, batch: 3700 // loss: 0.092\n", "\n", "epoch: 1, batch: 0 // loss: 0.108\n", "epoch: 1, batch: 100 // loss: 0.089\n", "epoch: 1, batch: 200 // loss: 0.101\n", "epoch: 1, batch: 300 // loss: 0.090\n", "epoch: 1, batch: 400 // loss: 0.094\n", "epoch: 1, batch: 500 // loss: 0.080\n", "epoch: 1, batch: 600 // loss: 0.086\n", "epoch: 1, batch: 700 // loss: 0.086\n", "epoch: 1, batch: 800 // loss: 0.089\n", "epoch: 1, batch: 900 // loss: 0.093\n", "epoch: 1, batch: 1000 // loss: 0.075\n", "epoch: 1, batch: 1100 // loss: 0.086\n", "epoch: 1, batch: 1200 // loss: 0.084\n", "epoch: 1, batch: 1300 // loss: 0.086\n", "epoch: 1, batch: 1400 // loss: 0.084\n", "epoch: 1, batch: 1500 // loss: 0.079\n", "epoch: 1, batch: 1600 // loss: 0.089\n", "epoch: 1, batch: 1700 // loss: 0.089\n", "epoch: 1, batch: 1800 // loss: 0.086\n", "epoch: 1, batch: 1900 // loss: 0.082\n", "epoch: 1, batch: 2000 // loss: 0.071\n", "epoch: 1, batch: 2100 // loss: 0.085\n", "epoch: 1, batch: 2200 // loss: 0.093\n", "epoch: 1, batch: 2300 // loss: 0.087\n", "epoch: 1, batch: 2400 // loss: 0.075\n", "epoch: 1, batch: 2500 // loss: 0.072\n", "epoch: 1, batch: 2600 // loss: 0.083\n", "epoch: 1, batch: 2700 // loss: 0.074\n", "epoch: 1, batch: 2800 // loss: 0.084\n", "epoch: 1, batch: 2900 // loss: 0.073\n", "epoch: 1, batch: 3000 // loss: 0.075\n", "epoch: 1, batch: 3100 // loss: 0.071\n", "epoch: 1, batch: 3200 // loss: 0.070\n", "epoch: 1, batch: 3300 // loss: 0.068\n", "epoch: 1, batch: 3400 // loss: 0.062\n", "epoch: 1, batch: 3500 // loss: 0.063\n", "epoch: 1, batch: 3600 // loss: 0.074\n", "epoch: 1, batch: 3700 // loss: 0.071\n", "\n", "epoch: 2, batch: 0 // loss: 0.086\n", "epoch: 2, batch: 100 // loss: 0.075\n", "epoch: 2, batch: 200 // loss: 0.070\n", "epoch: 2, batch: 300 // loss: 0.072\n", "epoch: 2, batch: 400 // loss: 0.073\n", "epoch: 2, batch: 500 // loss: 0.059\n", "epoch: 2, batch: 600 // loss: 0.065\n", "epoch: 2, batch: 700 // loss: 0.065\n", "epoch: 2, batch: 800 // loss: 0.067\n", "epoch: 2, batch: 900 // loss: 0.072\n", "epoch: 2, batch: 1000 // loss: 0.056\n", "epoch: 2, batch: 1100 // loss: 0.062\n", "epoch: 2, batch: 1200 // loss: 0.060\n", "epoch: 2, batch: 1300 // loss: 0.067\n", "epoch: 2, batch: 1400 // loss: 0.060\n", "epoch: 2, batch: 1500 // loss: 0.061\n", "epoch: 2, batch: 1600 // loss: 0.068\n", "epoch: 2, batch: 1700 // loss: 0.063\n", "epoch: 2, batch: 1800 // loss: 0.066\n", "epoch: 2, batch: 1900 // loss: 0.060\n", "epoch: 2, batch: 2000 // loss: 0.057\n", "epoch: 2, batch: 2100 // loss: 0.062\n", "epoch: 2, batch: 2200 // loss: 0.070\n", "epoch: 2, batch: 2300 // loss: 0.067\n", "epoch: 2, batch: 2400 // loss: 0.049\n", "epoch: 2, batch: 2500 // loss: 0.054\n", "epoch: 2, batch: 2600 // loss: 0.058\n", "epoch: 2, batch: 2700 // loss: 0.055\n", "epoch: 2, batch: 2800 // loss: 0.059\n", "epoch: 2, batch: 2900 // loss: 0.056\n", "epoch: 2, batch: 3000 // loss: 0.057\n", "epoch: 2, batch: 3100 // loss: 0.050\n", "epoch: 2, batch: 3200 // loss: 0.050\n", "epoch: 2, batch: 3300 // loss: 0.049\n", "epoch: 2, batch: 3400 // loss: 0.048\n", "epoch: 2, batch: 3500 // loss: 0.042\n", "epoch: 2, batch: 3600 // loss: 0.052\n", "epoch: 2, batch: 3700 // loss: 0.051\n", "\n", "epoch: 3, batch: 0 // loss: 0.067\n", "epoch: 3, batch: 100 // loss: 0.060\n", "epoch: 3, batch: 200 // loss: 0.051\n", "epoch: 3, batch: 300 // loss: 0.058\n", "epoch: 3, batch: 400 // loss: 0.056\n", "epoch: 3, batch: 500 // loss: 0.045\n", "epoch: 3, batch: 600 // loss: 0.048\n", "epoch: 3, batch: 700 // loss: 0.051\n", "epoch: 3, batch: 800 // loss: 0.052\n", "epoch: 3, batch: 900 // loss: 0.058\n", "epoch: 3, batch: 1000 // loss: 0.046\n", "epoch: 3, batch: 1100 // loss: 0.048\n", "epoch: 3, batch: 1200 // loss: 0.050\n", "epoch: 3, batch: 1300 // loss: 0.053\n", "epoch: 3, batch: 1400 // loss: 0.047\n", "epoch: 3, batch: 1500 // loss: 0.052\n", "epoch: 3, batch: 1600 // loss: 0.059\n", "epoch: 3, batch: 1700 // loss: 0.050\n", "epoch: 3, batch: 1800 // loss: 0.055\n", "epoch: 3, batch: 1900 // loss: 0.050\n", "epoch: 3, batch: 2000 // loss: 0.049\n", "epoch: 3, batch: 2100 // loss: 0.052\n", "epoch: 3, batch: 2200 // loss: 0.055\n", "epoch: 3, batch: 2300 // loss: 0.054\n", "epoch: 3, batch: 2400 // loss: 0.043\n", "epoch: 3, batch: 2500 // loss: 0.046\n", "epoch: 3, batch: 2600 // loss: 0.048\n", "epoch: 3, batch: 2700 // loss: 0.046\n", "epoch: 3, batch: 2800 // loss: 0.048\n", "epoch: 3, batch: 2900 // loss: 0.048\n", "epoch: 3, batch: 3000 // loss: 0.050\n", "epoch: 3, batch: 3100 // loss: 0.043\n", "epoch: 3, batch: 3200 // loss: 0.043\n", "epoch: 3, batch: 3300 // loss: 0.041\n", "epoch: 3, batch: 3400 // loss: 0.044\n", "epoch: 3, batch: 3500 // loss: 0.035\n", "epoch: 3, batch: 3600 // loss: 0.044\n", "epoch: 3, batch: 3700 // loss: 0.044\n", "\n", "epoch: 4, batch: 0 // loss: 0.057\n", "epoch: 4, batch: 100 // loss: 0.049\n", "epoch: 4, batch: 200 // loss: 0.044\n", "epoch: 4, batch: 300 // loss: 0.052\n", "epoch: 4, batch: 400 // loss: 0.047\n", "epoch: 4, batch: 500 // loss: 0.040\n", "epoch: 4, batch: 600 // loss: 0.041\n", "epoch: 4, batch: 700 // loss: 0.045\n", "epoch: 4, batch: 800 // loss: 0.042\n", "epoch: 4, batch: 900 // loss: 0.050\n", "epoch: 4, batch: 1000 // loss: 0.043\n", "epoch: 4, batch: 1100 // loss: 0.043\n", "epoch: 4, batch: 1200 // loss: 0.045\n", "epoch: 4, batch: 1300 // loss: 0.046\n", "epoch: 4, batch: 1400 // loss: 0.042\n", "epoch: 4, batch: 1500 // loss: 0.046\n", "epoch: 4, batch: 1600 // loss: 0.053\n", "epoch: 4, batch: 1700 // loss: 0.043\n", "epoch: 4, batch: 1800 // loss: 0.050\n", "epoch: 4, batch: 1900 // loss: 0.044\n", "epoch: 4, batch: 2000 // loss: 0.045\n", "epoch: 4, batch: 2100 // loss: 0.046\n", "epoch: 4, batch: 2200 // loss: 0.048\n", "epoch: 4, batch: 2300 // loss: 0.049\n", "epoch: 4, batch: 2400 // loss: 0.041\n", "epoch: 4, batch: 2500 // loss: 0.042\n", "epoch: 4, batch: 2600 // loss: 0.044\n", "epoch: 4, batch: 2700 // loss: 0.042\n", "epoch: 4, batch: 2800 // loss: 0.043\n", "epoch: 4, batch: 2900 // loss: 0.044\n", "epoch: 4, batch: 3000 // loss: 0.046\n", "epoch: 4, batch: 3100 // loss: 0.040\n", "epoch: 4, batch: 3200 // loss: 0.038\n", "epoch: 4, batch: 3300 // loss: 0.038\n", "epoch: 4, batch: 3400 // loss: 0.042\n", "epoch: 4, batch: 3500 // loss: 0.032\n", "epoch: 4, batch: 3600 // loss: 0.041\n", "epoch: 4, batch: 3700 // loss: 0.040\n", "\n", "epoch: 5, batch: 0 // loss: 0.052\n", "epoch: 5, batch: 100 // loss: 0.045\n", "epoch: 5, batch: 200 // loss: 0.041\n", "epoch: 5, batch: 300 // loss: 0.048\n", "epoch: 5, batch: 400 // loss: 0.044\n", "epoch: 5, batch: 500 // loss: 0.038\n", "epoch: 5, batch: 600 // loss: 0.038\n", "epoch: 5, batch: 700 // loss: 0.041\n", "epoch: 5, batch: 800 // loss: 0.039\n", "epoch: 5, batch: 900 // loss: 0.046\n", "epoch: 5, batch: 1000 // loss: 0.042\n", "epoch: 5, batch: 1100 // loss: 0.041\n", "epoch: 5, batch: 1200 // loss: 0.043\n", "epoch: 5, batch: 1300 // loss: 0.043\n", "epoch: 5, batch: 1400 // loss: 0.040\n", "epoch: 5, batch: 1500 // loss: 0.043\n", "epoch: 5, batch: 1600 // loss: 0.050\n", "epoch: 5, batch: 1700 // loss: 0.040\n", "epoch: 5, batch: 1800 // loss: 0.048\n", "epoch: 5, batch: 1900 // loss: 0.042\n", "epoch: 5, batch: 2000 // loss: 0.043\n", "epoch: 5, batch: 2100 // loss: 0.044\n", "epoch: 5, batch: 2200 // loss: 0.045\n", "epoch: 5, batch: 2300 // loss: 0.046\n", "epoch: 5, batch: 2400 // loss: 0.039\n", "epoch: 5, batch: 2500 // loss: 0.040\n", "epoch: 5, batch: 2600 // loss: 0.042\n", "epoch: 5, batch: 2700 // loss: 0.041\n", "epoch: 5, batch: 2800 // loss: 0.041\n", "epoch: 5, batch: 2900 // loss: 0.042\n", "epoch: 5, batch: 3000 // loss: 0.044\n", "epoch: 5, batch: 3100 // loss: 0.040\n", "epoch: 5, batch: 3200 // loss: 0.036\n", "epoch: 5, batch: 3300 // loss: 0.036\n", "epoch: 5, batch: 3400 // loss: 0.041\n", "epoch: 5, batch: 3500 // loss: 0.031\n", "epoch: 5, batch: 3600 // loss: 0.040\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 5, batch: 3700 // loss: 0.038\n", "\n", "epoch: 6, batch: 0 // loss: 0.051\n", "epoch: 6, batch: 100 // loss: 0.043\n", "epoch: 6, batch: 200 // loss: 0.039\n", "epoch: 6, batch: 300 // loss: 0.047\n", "epoch: 6, batch: 400 // loss: 0.043\n", "epoch: 6, batch: 500 // loss: 0.037\n", "epoch: 6, batch: 600 // loss: 0.037\n", "epoch: 6, batch: 700 // loss: 0.041\n", "epoch: 6, batch: 800 // loss: 0.037\n", "epoch: 6, batch: 900 // loss: 0.045\n", "epoch: 6, batch: 1000 // loss: 0.042\n", "epoch: 6, batch: 1100 // loss: 0.041\n", "epoch: 6, batch: 1200 // loss: 0.042\n", "epoch: 6, batch: 1300 // loss: 0.042\n", "epoch: 6, batch: 1400 // loss: 0.040\n", "epoch: 6, batch: 1500 // loss: 0.042\n", "epoch: 6, batch: 1600 // loss: 0.049\n", "epoch: 6, batch: 1700 // loss: 0.039\n", "epoch: 6, batch: 1800 // loss: 0.047\n", "epoch: 6, batch: 1900 // loss: 0.041\n", "epoch: 6, batch: 2000 // loss: 0.042\n", "epoch: 6, batch: 2100 // loss: 0.042\n", "epoch: 6, batch: 2200 // loss: 0.044\n", "epoch: 6, batch: 2300 // loss: 0.045\n", "epoch: 6, batch: 2400 // loss: 0.038\n", "epoch: 6, batch: 2500 // loss: 0.039\n", "epoch: 6, batch: 2600 // loss: 0.042\n", "epoch: 6, batch: 2700 // loss: 0.041\n", "epoch: 6, batch: 2800 // loss: 0.040\n", "epoch: 6, batch: 2900 // loss: 0.041\n", "epoch: 6, batch: 3000 // loss: 0.044\n", "epoch: 6, batch: 3100 // loss: 0.039\n", "epoch: 6, batch: 3200 // loss: 0.036\n", "epoch: 6, batch: 3300 // loss: 0.035\n", "epoch: 6, batch: 3400 // loss: 0.040\n", "epoch: 6, batch: 3500 // loss: 0.030\n", "epoch: 6, batch: 3600 // loss: 0.039\n", "epoch: 6, batch: 3700 // loss: 0.037\n", "\n", "epoch: 7, batch: 0 // loss: 0.049\n", "epoch: 7, batch: 100 // loss: 0.042\n", "epoch: 7, batch: 200 // loss: 0.038\n", "epoch: 7, batch: 300 // loss: 0.046\n", "epoch: 7, batch: 400 // loss: 0.042\n", "epoch: 7, batch: 500 // loss: 0.036\n", "epoch: 7, batch: 600 // loss: 0.036\n", "epoch: 7, batch: 700 // loss: 0.040\n", "epoch: 7, batch: 800 // loss: 0.036\n", "epoch: 7, batch: 900 // loss: 0.044\n", "epoch: 7, batch: 1000 // loss: 0.042\n", "epoch: 7, batch: 1100 // loss: 0.040\n", "epoch: 7, batch: 1200 // loss: 0.041\n", "epoch: 7, batch: 1300 // loss: 0.042\n", "epoch: 7, batch: 1400 // loss: 0.039\n", "epoch: 7, batch: 1500 // loss: 0.042\n", "epoch: 7, batch: 1600 // loss: 0.048\n", "epoch: 7, batch: 1700 // loss: 0.038\n", "epoch: 7, batch: 1800 // loss: 0.046\n", "epoch: 7, batch: 1900 // loss: 0.041\n", "epoch: 7, batch: 2000 // loss: 0.042\n", "epoch: 7, batch: 2100 // loss: 0.041\n", "epoch: 7, batch: 2200 // loss: 0.043\n", "epoch: 7, batch: 2300 // loss: 0.044\n", "epoch: 7, batch: 2400 // loss: 0.037\n", "epoch: 7, batch: 2500 // loss: 0.039\n", "epoch: 7, batch: 2600 // loss: 0.041\n", "epoch: 7, batch: 2700 // loss: 0.040\n", "epoch: 7, batch: 2800 // loss: 0.039\n", "epoch: 7, batch: 2900 // loss: 0.040\n", "epoch: 7, batch: 3000 // loss: 0.043\n", "epoch: 7, batch: 3100 // loss: 0.039\n", "epoch: 7, batch: 3200 // loss: 0.035\n", "epoch: 7, batch: 3300 // loss: 0.034\n", "epoch: 7, batch: 3400 // loss: 0.040\n", "epoch: 7, batch: 3500 // loss: 0.030\n", "epoch: 7, batch: 3600 // loss: 0.038\n", "epoch: 7, batch: 3700 // loss: 0.037\n", "\n", "epoch: 8, batch: 0 // loss: 0.048\n", "epoch: 8, batch: 100 // loss: 0.041\n", "epoch: 8, batch: 200 // loss: 0.037\n", "epoch: 8, batch: 300 // loss: 0.045\n", "epoch: 8, batch: 400 // loss: 0.041\n", "epoch: 8, batch: 500 // loss: 0.035\n", "epoch: 8, batch: 600 // loss: 0.036\n", "epoch: 8, batch: 700 // loss: 0.039\n", "epoch: 8, batch: 800 // loss: 0.036\n", "epoch: 8, batch: 900 // loss: 0.043\n", "epoch: 8, batch: 1000 // loss: 0.041\n", "epoch: 8, batch: 1100 // loss: 0.039\n", "epoch: 8, batch: 1200 // loss: 0.040\n", "epoch: 8, batch: 1300 // loss: 0.041\n", "epoch: 8, batch: 1400 // loss: 0.038\n", "epoch: 8, batch: 1500 // loss: 0.041\n", "epoch: 8, batch: 1600 // loss: 0.047\n", "epoch: 8, batch: 1700 // loss: 0.037\n", "epoch: 8, batch: 1800 // loss: 0.046\n", "epoch: 8, batch: 1900 // loss: 0.039\n", "epoch: 8, batch: 2000 // loss: 0.041\n", "epoch: 8, batch: 2100 // loss: 0.040\n", "epoch: 8, batch: 2200 // loss: 0.042\n", "epoch: 8, batch: 2300 // loss: 0.043\n", "epoch: 8, batch: 2400 // loss: 0.037\n", "epoch: 8, batch: 2500 // loss: 0.038\n", "epoch: 8, batch: 2600 // loss: 0.041\n", "epoch: 8, batch: 2700 // loss: 0.039\n", "epoch: 8, batch: 2800 // loss: 0.038\n", "epoch: 8, batch: 2900 // loss: 0.039\n", "epoch: 8, batch: 3000 // loss: 0.042\n", "epoch: 8, batch: 3100 // loss: 0.038\n", "epoch: 8, batch: 3200 // loss: 0.034\n", "epoch: 8, batch: 3300 // loss: 0.034\n", "epoch: 8, batch: 3400 // loss: 0.039\n", "epoch: 8, batch: 3500 // loss: 0.029\n", "epoch: 8, batch: 3600 // loss: 0.037\n", "epoch: 8, batch: 3700 // loss: 0.036\n", "\n", "epoch: 9, batch: 0 // loss: 0.047\n", "epoch: 9, batch: 100 // loss: 0.040\n", "epoch: 9, batch: 200 // loss: 0.036\n", "epoch: 9, batch: 300 // loss: 0.044\n", "epoch: 9, batch: 400 // loss: 0.040\n", "epoch: 9, batch: 500 // loss: 0.035\n", "epoch: 9, batch: 600 // loss: 0.035\n", "epoch: 9, batch: 700 // loss: 0.038\n", "epoch: 9, batch: 800 // loss: 0.035\n", "epoch: 9, batch: 900 // loss: 0.042\n", "epoch: 9, batch: 1000 // loss: 0.040\n", "epoch: 9, batch: 1100 // loss: 0.038\n", "epoch: 9, batch: 1200 // loss: 0.039\n", "epoch: 9, batch: 1300 // loss: 0.040\n", "epoch: 9, batch: 1400 // loss: 0.037\n", "epoch: 9, batch: 1500 // loss: 0.039\n", "epoch: 9, batch: 1600 // loss: 0.046\n", "epoch: 9, batch: 1700 // loss: 0.036\n", "epoch: 9, batch: 1800 // loss: 0.044\n", "epoch: 9, batch: 1900 // loss: 0.037\n", "epoch: 9, batch: 2000 // loss: 0.040\n", "epoch: 9, batch: 2100 // loss: 0.039\n", "epoch: 9, batch: 2200 // loss: 0.041\n", "epoch: 9, batch: 2300 // loss: 0.041\n", "epoch: 9, batch: 2400 // loss: 0.036\n", "epoch: 9, batch: 2500 // loss: 0.037\n", "epoch: 9, batch: 2600 // loss: 0.040\n", "epoch: 9, batch: 2700 // loss: 0.037\n", "epoch: 9, batch: 2800 // loss: 0.036\n", "epoch: 9, batch: 2900 // loss: 0.038\n", "epoch: 9, batch: 3000 // loss: 0.041\n", "epoch: 9, batch: 3100 // loss: 0.038\n", "epoch: 9, batch: 3200 // loss: 0.033\n", "epoch: 9, batch: 3300 // loss: 0.033\n", "epoch: 9, batch: 3400 // loss: 0.037\n", "epoch: 9, batch: 3500 // loss: 0.028\n", "epoch: 9, batch: 3600 // loss: 0.036\n", "epoch: 9, batch: 3700 // loss: 0.035\n", "\n", "epoch: 10, batch: 0 // loss: 0.045\n", "epoch: 10, batch: 100 // loss: 0.039\n", "epoch: 10, batch: 200 // loss: 0.035\n", "epoch: 10, batch: 300 // loss: 0.043\n", "epoch: 10, batch: 400 // loss: 0.039\n", "epoch: 10, batch: 500 // loss: 0.034\n", "epoch: 10, batch: 600 // loss: 0.034\n", "epoch: 10, batch: 700 // loss: 0.037\n", "epoch: 10, batch: 800 // loss: 0.034\n", "epoch: 10, batch: 900 // loss: 0.041\n", "epoch: 10, batch: 1000 // loss: 0.039\n", "epoch: 10, batch: 1100 // loss: 0.037\n", "epoch: 10, batch: 1200 // loss: 0.037\n", "epoch: 10, batch: 1300 // loss: 0.039\n", "epoch: 10, batch: 1400 // loss: 0.036\n", "epoch: 10, batch: 1500 // loss: 0.038\n", "epoch: 10, batch: 1600 // loss: 0.044\n", "epoch: 10, batch: 1700 // loss: 0.035\n", "epoch: 10, batch: 1800 // loss: 0.043\n", "epoch: 10, batch: 1900 // loss: 0.035\n", "epoch: 10, batch: 2000 // loss: 0.039\n", "epoch: 10, batch: 2100 // loss: 0.038\n", "epoch: 10, batch: 2200 // loss: 0.039\n", "epoch: 10, batch: 2300 // loss: 0.040\n", "epoch: 10, batch: 2400 // loss: 0.034\n", "epoch: 10, batch: 2500 // loss: 0.035\n", "epoch: 10, batch: 2600 // loss: 0.038\n", "epoch: 10, batch: 2700 // loss: 0.036\n", "epoch: 10, batch: 2800 // loss: 0.034\n", "epoch: 10, batch: 2900 // loss: 0.037\n", "epoch: 10, batch: 3000 // loss: 0.040\n", "epoch: 10, batch: 3100 // loss: 0.037\n", "epoch: 10, batch: 3200 // loss: 0.031\n", "epoch: 10, batch: 3300 // loss: 0.031\n", "epoch: 10, batch: 3400 // loss: 0.036\n", "epoch: 10, batch: 3500 // loss: 0.027\n", "epoch: 10, batch: 3600 // loss: 0.034\n", "epoch: 10, batch: 3700 // loss: 0.033\n", "\n", "epoch: 11, batch: 0 // loss: 0.044\n", "epoch: 11, batch: 100 // loss: 0.037\n", "epoch: 11, batch: 200 // loss: 0.034\n", "epoch: 11, batch: 300 // loss: 0.041\n", "epoch: 11, batch: 400 // loss: 0.037\n", "epoch: 11, batch: 500 // loss: 0.033\n", "epoch: 11, batch: 600 // loss: 0.033\n", "epoch: 11, batch: 700 // loss: 0.035\n", "epoch: 11, batch: 800 // loss: 0.032\n", "epoch: 11, batch: 900 // loss: 0.040\n", "epoch: 11, batch: 1000 // loss: 0.038\n", "epoch: 11, batch: 1100 // loss: 0.036\n", "epoch: 11, batch: 1200 // loss: 0.036\n", "epoch: 11, batch: 1300 // loss: 0.039\n", "epoch: 11, batch: 1400 // loss: 0.035\n", "epoch: 11, batch: 1500 // loss: 0.037\n", "epoch: 11, batch: 1600 // loss: 0.042\n", "epoch: 11, batch: 1700 // loss: 0.033\n", "epoch: 11, batch: 1800 // loss: 0.041\n", "epoch: 11, batch: 1900 // loss: 0.033\n", "epoch: 11, batch: 2000 // loss: 0.038\n", "epoch: 11, batch: 2100 // loss: 0.036\n", "epoch: 11, batch: 2200 // loss: 0.038\n", "epoch: 11, batch: 2300 // loss: 0.039\n", "epoch: 11, batch: 2400 // loss: 0.033\n", "epoch: 11, batch: 2500 // loss: 0.034\n", "epoch: 11, batch: 2600 // loss: 0.037\n", "epoch: 11, batch: 2700 // loss: 0.035\n", "epoch: 11, batch: 2800 // loss: 0.033\n", "epoch: 11, batch: 2900 // loss: 0.036\n", "epoch: 11, batch: 3000 // loss: 0.039\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 11, batch: 3100 // loss: 0.037\n", "epoch: 11, batch: 3200 // loss: 0.030\n", "epoch: 11, batch: 3300 // loss: 0.030\n", "epoch: 11, batch: 3400 // loss: 0.035\n", "epoch: 11, batch: 3500 // loss: 0.026\n", "epoch: 11, batch: 3600 // loss: 0.033\n", "epoch: 11, batch: 3700 // loss: 0.032\n", "\n", "epoch: 12, batch: 0 // loss: 0.042\n", "epoch: 12, batch: 100 // loss: 0.036\n", "epoch: 12, batch: 200 // loss: 0.033\n", "epoch: 12, batch: 300 // loss: 0.040\n", "epoch: 12, batch: 400 // loss: 0.036\n", "epoch: 12, batch: 500 // loss: 0.033\n", "epoch: 12, batch: 600 // loss: 0.033\n", "epoch: 12, batch: 700 // loss: 0.035\n", "epoch: 12, batch: 800 // loss: 0.031\n", "epoch: 12, batch: 900 // loss: 0.039\n", "epoch: 12, batch: 1000 // loss: 0.037\n", "epoch: 12, batch: 1100 // loss: 0.036\n", "epoch: 12, batch: 1200 // loss: 0.035\n", "epoch: 12, batch: 1300 // loss: 0.037\n", "epoch: 12, batch: 1400 // loss: 0.034\n", "epoch: 12, batch: 1500 // loss: 0.035\n", "epoch: 12, batch: 1600 // loss: 0.041\n", "epoch: 12, batch: 1700 // loss: 0.033\n", "epoch: 12, batch: 1800 // loss: 0.040\n", "epoch: 12, batch: 1900 // loss: 0.032\n", "epoch: 12, batch: 2000 // loss: 0.037\n", "epoch: 12, batch: 2100 // loss: 0.035\n", "epoch: 12, batch: 2200 // loss: 0.037\n", "epoch: 12, batch: 2300 // loss: 0.038\n", "epoch: 12, batch: 2400 // loss: 0.032\n", "epoch: 12, batch: 2500 // loss: 0.034\n", "epoch: 12, batch: 2600 // loss: 0.037\n", "epoch: 12, batch: 2700 // loss: 0.034\n", "epoch: 12, batch: 2800 // loss: 0.031\n", "epoch: 12, batch: 2900 // loss: 0.035\n", "epoch: 12, batch: 3000 // loss: 0.038\n", "epoch: 12, batch: 3100 // loss: 0.036\n", "epoch: 12, batch: 3200 // loss: 0.030\n", "epoch: 12, batch: 3300 // loss: 0.030\n", "epoch: 12, batch: 3400 // loss: 0.034\n", "epoch: 12, batch: 3500 // loss: 0.025\n", "epoch: 12, batch: 3600 // loss: 0.032\n", "epoch: 12, batch: 3700 // loss: 0.032\n", "\n", "epoch: 13, batch: 0 // loss: 0.042\n", "epoch: 13, batch: 100 // loss: 0.035\n", "epoch: 13, batch: 200 // loss: 0.032\n", "epoch: 13, batch: 300 // loss: 0.039\n", "epoch: 13, batch: 400 // loss: 0.035\n", "epoch: 13, batch: 500 // loss: 0.032\n", "epoch: 13, batch: 600 // loss: 0.032\n", "epoch: 13, batch: 700 // loss: 0.034\n", "epoch: 13, batch: 800 // loss: 0.031\n", "epoch: 13, batch: 900 // loss: 0.039\n", "epoch: 13, batch: 1000 // loss: 0.036\n", "epoch: 13, batch: 1100 // loss: 0.035\n", "epoch: 13, batch: 1200 // loss: 0.034\n", "epoch: 13, batch: 1300 // loss: 0.037\n", "epoch: 13, batch: 1400 // loss: 0.033\n", "epoch: 13, batch: 1500 // loss: 0.035\n", "epoch: 13, batch: 1600 // loss: 0.040\n", "epoch: 13, batch: 1700 // loss: 0.032\n", "epoch: 13, batch: 1800 // loss: 0.039\n", "epoch: 13, batch: 1900 // loss: 0.031\n", "epoch: 13, batch: 2000 // loss: 0.037\n", "epoch: 13, batch: 2100 // loss: 0.034\n", "epoch: 13, batch: 2200 // loss: 0.037\n", "epoch: 13, batch: 2300 // loss: 0.037\n", "epoch: 13, batch: 2400 // loss: 0.032\n", "epoch: 13, batch: 2500 // loss: 0.033\n", "epoch: 13, batch: 2600 // loss: 0.036\n", "epoch: 13, batch: 2700 // loss: 0.034\n", "epoch: 13, batch: 2800 // loss: 0.030\n", "epoch: 13, batch: 2900 // loss: 0.035\n", "epoch: 13, batch: 3000 // loss: 0.037\n", "epoch: 13, batch: 3100 // loss: 0.036\n", "epoch: 13, batch: 3200 // loss: 0.029\n", "epoch: 13, batch: 3300 // loss: 0.029\n", "epoch: 13, batch: 3400 // loss: 0.034\n", "epoch: 13, batch: 3500 // loss: 0.025\n", "epoch: 13, batch: 3600 // loss: 0.031\n", "epoch: 13, batch: 3700 // loss: 0.031\n", "\n", "epoch: 14, batch: 0 // loss: 0.041\n", "epoch: 14, batch: 100 // loss: 0.035\n", "epoch: 14, batch: 200 // loss: 0.031\n", "epoch: 14, batch: 300 // loss: 0.038\n", "epoch: 14, batch: 400 // loss: 0.034\n", "epoch: 14, batch: 500 // loss: 0.032\n", "epoch: 14, batch: 600 // loss: 0.032\n", "epoch: 14, batch: 700 // loss: 0.033\n", "epoch: 14, batch: 800 // loss: 0.030\n", "epoch: 14, batch: 900 // loss: 0.038\n", "epoch: 14, batch: 1000 // loss: 0.036\n", "epoch: 14, batch: 1100 // loss: 0.034\n", "epoch: 14, batch: 1200 // loss: 0.033\n", "epoch: 14, batch: 1300 // loss: 0.036\n", "epoch: 14, batch: 1400 // loss: 0.033\n", "epoch: 14, batch: 1500 // loss: 0.034\n", "epoch: 14, batch: 1600 // loss: 0.039\n", "epoch: 14, batch: 1700 // loss: 0.031\n", "epoch: 14, batch: 1800 // loss: 0.038\n", "epoch: 14, batch: 1900 // loss: 0.030\n", "epoch: 14, batch: 2000 // loss: 0.036\n", "epoch: 14, batch: 2100 // loss: 0.034\n", "epoch: 14, batch: 2200 // loss: 0.036\n", "epoch: 14, batch: 2300 // loss: 0.036\n", "epoch: 14, batch: 2400 // loss: 0.031\n", "epoch: 14, batch: 2500 // loss: 0.033\n", "epoch: 14, batch: 2600 // loss: 0.035\n", "epoch: 14, batch: 2700 // loss: 0.033\n", "epoch: 14, batch: 2800 // loss: 0.030\n", "epoch: 14, batch: 2900 // loss: 0.034\n", "epoch: 14, batch: 3000 // loss: 0.037\n", "epoch: 14, batch: 3100 // loss: 0.035\n", "epoch: 14, batch: 3200 // loss: 0.029\n", "epoch: 14, batch: 3300 // loss: 0.029\n", "epoch: 14, batch: 3400 // loss: 0.033\n", "epoch: 14, batch: 3500 // loss: 0.025\n", "epoch: 14, batch: 3600 // loss: 0.031\n", "epoch: 14, batch: 3700 // loss: 0.030\n", "\n", "epoch: 15, batch: 0 // loss: 0.040\n", "epoch: 15, batch: 100 // loss: 0.034\n", "epoch: 15, batch: 200 // loss: 0.031\n", "epoch: 15, batch: 300 // loss: 0.038\n", "epoch: 15, batch: 400 // loss: 0.034\n", "epoch: 15, batch: 500 // loss: 0.032\n", "epoch: 15, batch: 600 // loss: 0.031\n", "epoch: 15, batch: 700 // loss: 0.033\n", "epoch: 15, batch: 800 // loss: 0.029\n", "epoch: 15, batch: 900 // loss: 0.038\n", "epoch: 15, batch: 1000 // loss: 0.036\n", "epoch: 15, batch: 1100 // loss: 0.034\n", "epoch: 15, batch: 1200 // loss: 0.033\n", "epoch: 15, batch: 1300 // loss: 0.036\n", "epoch: 15, batch: 1400 // loss: 0.033\n", "epoch: 15, batch: 1500 // loss: 0.034\n", "epoch: 15, batch: 1600 // loss: 0.039\n", "epoch: 15, batch: 1700 // loss: 0.031\n", "epoch: 15, batch: 1800 // loss: 0.037\n", "epoch: 15, batch: 1900 // loss: 0.030\n", "epoch: 15, batch: 2000 // loss: 0.035\n", "epoch: 15, batch: 2100 // loss: 0.033\n", "epoch: 15, batch: 2200 // loss: 0.036\n", "epoch: 15, batch: 2300 // loss: 0.036\n", "epoch: 15, batch: 2400 // loss: 0.031\n", "epoch: 15, batch: 2500 // loss: 0.032\n", "epoch: 15, batch: 2600 // loss: 0.035\n", "epoch: 15, batch: 2700 // loss: 0.033\n", "epoch: 15, batch: 2800 // loss: 0.029\n", "epoch: 15, batch: 2900 // loss: 0.034\n", "epoch: 15, batch: 3000 // loss: 0.036\n", "epoch: 15, batch: 3100 // loss: 0.035\n", "epoch: 15, batch: 3200 // loss: 0.028\n", "epoch: 15, batch: 3300 // loss: 0.028\n", "epoch: 15, batch: 3400 // loss: 0.033\n", "epoch: 15, batch: 3500 // loss: 0.024\n", "epoch: 15, batch: 3600 // loss: 0.030\n", "epoch: 15, batch: 3700 // loss: 0.030\n", "\n", "epoch: 16, batch: 0 // loss: 0.040\n", "epoch: 16, batch: 100 // loss: 0.033\n", "epoch: 16, batch: 200 // loss: 0.030\n", "epoch: 16, batch: 300 // loss: 0.037\n", "epoch: 16, batch: 400 // loss: 0.033\n", "epoch: 16, batch: 500 // loss: 0.031\n", "epoch: 16, batch: 600 // loss: 0.031\n", "epoch: 16, batch: 700 // loss: 0.032\n", "epoch: 16, batch: 800 // loss: 0.029\n", "epoch: 16, batch: 900 // loss: 0.038\n", "epoch: 16, batch: 1000 // loss: 0.035\n", "epoch: 16, batch: 1100 // loss: 0.033\n", "epoch: 16, batch: 1200 // loss: 0.032\n", "epoch: 16, batch: 1300 // loss: 0.036\n", "epoch: 16, batch: 1400 // loss: 0.032\n", "epoch: 16, batch: 1500 // loss: 0.034\n", "epoch: 16, batch: 1600 // loss: 0.038\n", "epoch: 16, batch: 1700 // loss: 0.030\n", "epoch: 16, batch: 1800 // loss: 0.036\n", "epoch: 16, batch: 1900 // loss: 0.029\n", "epoch: 16, batch: 2000 // loss: 0.035\n", "epoch: 16, batch: 2100 // loss: 0.033\n", "epoch: 16, batch: 2200 // loss: 0.035\n", "epoch: 16, batch: 2300 // loss: 0.035\n", "epoch: 16, batch: 2400 // loss: 0.031\n", "epoch: 16, batch: 2500 // loss: 0.031\n", "epoch: 16, batch: 2600 // loss: 0.035\n", "epoch: 16, batch: 2700 // loss: 0.032\n", "epoch: 16, batch: 2800 // loss: 0.029\n", "epoch: 16, batch: 2900 // loss: 0.033\n", "epoch: 16, batch: 3000 // loss: 0.036\n", "epoch: 16, batch: 3100 // loss: 0.034\n", "epoch: 16, batch: 3200 // loss: 0.027\n", "epoch: 16, batch: 3300 // loss: 0.028\n", "epoch: 16, batch: 3400 // loss: 0.032\n", "epoch: 16, batch: 3500 // loss: 0.024\n", "epoch: 16, batch: 3600 // loss: 0.029\n", "epoch: 16, batch: 3700 // loss: 0.029\n", "\n", "epoch: 17, batch: 0 // loss: 0.039\n", "epoch: 17, batch: 100 // loss: 0.032\n", "epoch: 17, batch: 200 // loss: 0.029\n", "epoch: 17, batch: 300 // loss: 0.037\n", "epoch: 17, batch: 400 // loss: 0.033\n", "epoch: 17, batch: 500 // loss: 0.031\n", "epoch: 17, batch: 600 // loss: 0.030\n", "epoch: 17, batch: 700 // loss: 0.032\n", "epoch: 17, batch: 800 // loss: 0.028\n", "epoch: 17, batch: 900 // loss: 0.037\n", "epoch: 17, batch: 1000 // loss: 0.035\n", "epoch: 17, batch: 1100 // loss: 0.032\n", "epoch: 17, batch: 1200 // loss: 0.031\n", "epoch: 17, batch: 1300 // loss: 0.035\n", "epoch: 17, batch: 1400 // loss: 0.031\n", "epoch: 17, batch: 1500 // loss: 0.033\n", "epoch: 17, batch: 1600 // loss: 0.037\n", "epoch: 17, batch: 1700 // loss: 0.030\n", "epoch: 17, batch: 1800 // loss: 0.035\n", "epoch: 17, batch: 1900 // loss: 0.029\n", "epoch: 17, batch: 2000 // loss: 0.034\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "epoch: 17, batch: 2100 // loss: 0.032\n", "epoch: 17, batch: 2200 // loss: 0.034\n", "epoch: 17, batch: 2300 // loss: 0.033\n", "epoch: 17, batch: 2400 // loss: 0.030\n", "epoch: 17, batch: 2500 // loss: 0.030\n", "epoch: 17, batch: 2600 // loss: 0.034\n", "epoch: 17, batch: 2700 // loss: 0.031\n", "epoch: 17, batch: 2800 // loss: 0.028\n", "epoch: 17, batch: 2900 // loss: 0.032\n", "epoch: 17, batch: 3000 // loss: 0.035\n", "epoch: 17, batch: 3100 // loss: 0.034\n", "epoch: 17, batch: 3200 // loss: 0.027\n", "epoch: 17, batch: 3300 // loss: 0.027\n", "epoch: 17, batch: 3400 // loss: 0.031\n", "epoch: 17, batch: 3500 // loss: 0.024\n", "epoch: 17, batch: 3600 // loss: 0.029\n", "epoch: 17, batch: 3700 // loss: 0.028\n", "\n", "epoch: 18, batch: 0 // loss: 0.039\n", "epoch: 18, batch: 100 // loss: 0.031\n", "epoch: 18, batch: 200 // loss: 0.028\n", "epoch: 18, batch: 300 // loss: 0.036\n", "epoch: 18, batch: 400 // loss: 0.032\n", "epoch: 18, batch: 500 // loss: 0.031\n", "epoch: 18, batch: 600 // loss: 0.030\n", "epoch: 18, batch: 700 // loss: 0.031\n", "epoch: 18, batch: 800 // loss: 0.027\n", "epoch: 18, batch: 900 // loss: 0.036\n", "epoch: 18, batch: 1000 // loss: 0.034\n", "epoch: 18, batch: 1100 // loss: 0.031\n", "epoch: 18, batch: 1200 // loss: 0.031\n", "epoch: 18, batch: 1300 // loss: 0.034\n", "epoch: 18, batch: 1400 // loss: 0.031\n", "epoch: 18, batch: 1500 // loss: 0.033\n", "epoch: 18, batch: 1600 // loss: 0.036\n", "epoch: 18, batch: 1700 // loss: 0.030\n", "epoch: 18, batch: 1800 // loss: 0.033\n", "epoch: 18, batch: 1900 // loss: 0.028\n", "epoch: 18, batch: 2000 // loss: 0.033\n", "epoch: 18, batch: 2100 // loss: 0.031\n", "epoch: 18, batch: 2200 // loss: 0.033\n", "epoch: 18, batch: 2300 // loss: 0.032\n", "epoch: 18, batch: 2400 // loss: 0.029\n", "epoch: 18, batch: 2500 // loss: 0.029\n", "epoch: 18, batch: 2600 // loss: 0.033\n", "epoch: 18, batch: 2700 // loss: 0.030\n", "epoch: 18, batch: 2800 // loss: 0.027\n", "epoch: 18, batch: 2900 // loss: 0.031\n", "epoch: 18, batch: 3000 // loss: 0.034\n", "epoch: 18, batch: 3100 // loss: 0.033\n", "epoch: 18, batch: 3200 // loss: 0.026\n", "epoch: 18, batch: 3300 // loss: 0.026\n", "epoch: 18, batch: 3400 // loss: 0.030\n", "epoch: 18, batch: 3500 // loss: 0.023\n", "epoch: 18, batch: 3600 // loss: 0.028\n", "epoch: 18, batch: 3700 // loss: 0.027\n", "\n", "epoch: 19, batch: 0 // loss: 0.038\n", "epoch: 19, batch: 100 // loss: 0.030\n", "epoch: 19, batch: 200 // loss: 0.027\n", "epoch: 19, batch: 300 // loss: 0.035\n", "epoch: 19, batch: 400 // loss: 0.031\n", "epoch: 19, batch: 500 // loss: 0.030\n", "epoch: 19, batch: 600 // loss: 0.029\n", "epoch: 19, batch: 700 // loss: 0.030\n", "epoch: 19, batch: 800 // loss: 0.026\n", "epoch: 19, batch: 900 // loss: 0.036\n", "epoch: 19, batch: 1000 // loss: 0.033\n", "epoch: 19, batch: 1100 // loss: 0.031\n", "epoch: 19, batch: 1200 // loss: 0.030\n", "epoch: 19, batch: 1300 // loss: 0.034\n", "epoch: 19, batch: 1400 // loss: 0.030\n", "epoch: 19, batch: 1500 // loss: 0.033\n", "epoch: 19, batch: 1600 // loss: 0.035\n", "epoch: 19, batch: 1700 // loss: 0.029\n", "epoch: 19, batch: 1800 // loss: 0.032\n", "epoch: 19, batch: 1900 // loss: 0.027\n", "epoch: 19, batch: 2000 // loss: 0.033\n", "epoch: 19, batch: 2100 // loss: 0.030\n", "epoch: 19, batch: 2200 // loss: 0.031\n", "epoch: 19, batch: 2300 // loss: 0.031\n", "epoch: 19, batch: 2400 // loss: 0.029\n", "epoch: 19, batch: 2500 // loss: 0.028\n", "epoch: 19, batch: 2600 // loss: 0.033\n", "epoch: 19, batch: 2700 // loss: 0.029\n", "epoch: 19, batch: 2800 // loss: 0.026\n", "epoch: 19, batch: 2900 // loss: 0.030\n", "epoch: 19, batch: 3000 // loss: 0.033\n", "epoch: 19, batch: 3100 // loss: 0.032\n", "epoch: 19, batch: 3200 // loss: 0.025\n", "epoch: 19, batch: 3300 // loss: 0.025\n", "epoch: 19, batch: 3400 // loss: 0.029\n", "epoch: 19, batch: 3500 // loss: 0.023\n", "epoch: 19, batch: 3600 // loss: 0.027\n", "epoch: 19, batch: 3700 // loss: 0.026\n" ] } ], "source": [ "m = VAE()\n", "optimizer = optim.SGD(m.parameters(), lr=0.01, momentum=0.9)\n", "train_VAE(X, X, m, optimizer, loss_function, EPOCHS=20)" ] }, { "cell_type": "code", "execution_count": 169, "metadata": {}, "outputs": [ { "name": "stderr", "output_type": "stream", "text": [ "/anaconda3/lib/python3.7/site-packages/ipykernel_launcher.py:39: UserWarning: To copy construct from a tensor, it is recommended to use sourceTensor.clone().detach() or sourceTensor.clone().detach().requires_grad_(True), rather than torch.tensor(sourceTensor).\n" ] } ], "source": [ "samples = [m(X[2,:].float())[0].detach().numpy() for _ in range(5)]" ] }, { "cell_type": "code", "execution_count": 174, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "" ] }, "execution_count": 174, "metadata": {}, "output_type": "execute_result" }, { "data": { "image/png": "iVBORw0KGgoAAAANSUhEUgAAAPsAAAD4CAYAAAAq5pAIAAAABHNCSVQICAgIfAhkiAAAAAlwSFlzAAALEgAACxIB0t1+/AAAADh0RVh0U29mdHdhcmUAbWF0cGxvdGxpYiB2ZXJzaW9uMy4xLjEsIGh0dHA6Ly9tYXRwbG90bGliLm9yZy8QZhcZAAASjUlEQVR4nO3dX2hc95UH8O83jv9E8l/FtiwsEXvrxGwIrLsYZyHLkqVsSf3i9KGbGlK8EFZ9aKGFPmzwPjQvC2HZttuHpURdh7pLN6WhDfFDWOqYQuhLiW28ibPaJI7jrSVNJNuKLclOIv85+6Drojqac+S5M3MnPt8PGElzdOce3ZnjOzPn/n4/mhlE5M53V9UJiEh7qNhFklCxiyShYhdJQsUuksTd7dwZSX3034De3l43vnTp0rqxu+7y/z+/du1aQzk1A0k3Pjo62qZM7ixmtuCBLVXsJB8D8EMASwD8u5k9W+b+ZGFPPvmkG+/v768bW7ZsmbvthQsXGsrppiVLlrjxGzdu1I3dfbf/9Nu/f78bV9v49jT8Mp7kEgD/BuBLAB4EsJfkg81KTESaq8x79l0ATpnZaTObBfBzAHuak5aINFuZYt8M4Oy8n0eK2/4IyUGSR0keLbEvESmpzHv2hT4E+NSbKDMbAjAE6AM6kSqVObOPABiY93M/gLFy6YhIq5Qp9tcB3E9yK8llAL4K4FBz0hKRZmOZ9gXJ3QD+FXOtt+fN7J+C378jX8Zv3LjRjU9MTLjxJ554wo1Hrbfly5fXjT388MPutlFrbsWKFW488v7779eNnTp1yt327bffduMvvviiGz9x4kTd2NTUlLvtZ1lL+uxm9gqAV8rch4i0hy6XFUlCxS6ShIpdJAkVu0gSKnaRJFTsIkm0dTz7Z9nq1avrxrq6utxtt23b5sajMeXRMNSBgYG6sXfeecfdNuqj33PPPW784sWLbrxWq9WNXb9+3d12enrajUfXCPT19dWNrVu3zt12ZGTEjUe5dyKd2UWSULGLJKFiF0lCxS6ShIpdJAkVu0gSar0VNmzY4Ma99tjHH3/sbrtp0yY3HrWQojaPN4Q2mv01mmr6ww8/dOMRr7U3NubPdbJy5Uo3HrXPyuQePWZR7p04863O7CJJqNhFklCxiyShYhdJQsUukoSKXSQJFbtIEuqzF6JeuTddsxcDgI8++siNr1mzxo3fe++9bnxycrJu7NKlS+623iqrQNzrnpmZcePeSq3R8Npoumdv2DHg5xY9ZtG1DVu3bnXjp0+fduNV0JldJAkVu0gSKnaRJFTsIkmo2EWSULGLJKFiF0kiTZ896hdHfVdvfHLUR4/2HfW6vT464Pfpr1y54m67atUqNx71m6Px8l6vPLq2Ibr+oLu72417fXxywVWN/8C7PgAAZmdn3Xh0/1WMdy9V7CTPAJgGcB3ANTPb2YykRKT5mnFm/2szO9+E+xGRFtJ7dpEkyha7Afg1yWMkBxf6BZKDJI+SPFpyXyJSQtmX8Y+Y2RjJjQAOk/xfM3tt/i+Y2RCAIQAg2Xmz8IkkUerMbmZjxdcJAC8B2NWMpESk+RoudpLdJFfd/B7AFwGcbFZiItJcZV7G9wJ4qegn3g3gP83sv5qSVQtE/eRo/nRv3vio3xv1XKPx6tGc9p7o746uL4iWbI6uEfDGnEe5vffee2486lV7ffozZ86420Zz+UePacR7vkXHtFENF7uZnQbwZ03MRURaSK03kSRU7CJJqNhFklCxiyShYhdJIs0Q16hVEi3vu379+rqxaBho1NaLpkS+evWqGy/TBopyi1pzUVvQO67T09PuttFU09H23uMSLff8ySefuPGoPRY9Jq1qr3l0ZhdJQsUukoSKXSQJFbtIEip2kSRU7CJJqNhFkkjTZ49EfVevbxoNA436xRMTE258+/btbtzLLZrGOoqfP+/PJdrf3+/Gvdy6urrcbaNrH6Khxd4U35cvX3a3jaa5jqaajqbYVp9dRFpGxS6ShIpdJAkVu0gSKnaRJFTsIkmo2EWSuGP67D09PW48GhMeLcHriaZEXrt2rRtfunRpw/sG/D5+dA1ANCY8mnL5gQcecONeL7xWq7nbRsc14vXxvaWkgXgc/8zMjBuPnm9V0JldJAkVu0gSKnaRJFTsIkmo2EWSULGLJKFiF0nijumzT05OuvGySw+XWTY5moM8mnfeG5cN+EsT9/X1udsODw+78WjcdjQe3vvbo7nVo2sAomWVvesPoryjsfRRHz06bt5j3qo558MzO8nnSU6QPDnvth6Sh0m+W3z1Z34Qkcot5mX8TwA8dsttTwM4Ymb3AzhS/CwiHSwsdjN7DcCtr5H3ADhYfH8QwONNzktEmqzR9+y9ZlYDADOrkdxY7xdJDgIYbHA/ItIkLf+AzsyGAAwBAElr9f5EZGGNtt7GSfYBQPHVnx5VRCrXaLEfArCv+H4fgJebk46ItEr4Mp7kCwAeBbCe5AiA7wJ4FsAvSD4F4PcAvtLKJBcjWmc86nVHfVdvHvGopxrNjx71k7214QF/LH/Us41yHxkZcePRNQLe3x6N84+Oy7Vr19y4l1s0Hj2670g0b7yXW6vmlA+L3cz21gl9ocm5iEgL6XJZkSRU7CJJqNhFklCxiyShYhdJ4o4Z4hq1K6IWU9Sa86Z7jto00bTEGzfWvdoYQDyl8ubNm+vGoqG9Fy9edOPRcYn+du9xKbuc9JUrV9x49Jh7olZuNOzYzL9YNIq3gs7sIkmo2EWSULGLJKFiF0lCxS6ShIpdJAkVu0gSd0yfPRrKGQ3FjPqe3rTE0TTTUby3t9eNe310wJ/2+Ny5c+62US+6zDBSwD9u4+Pj7rbRY+rdN+BPNR093t6QZiDuw5fZvlU9ep3ZRZJQsYskoWIXSULFLpKEil0kCRW7SBIqdpEk7pg+ezR1b9Sz9aZjBvzx7JGoV112zLm3fTTOf2pqyo1H01hfuHDBjXtj9aNeddRPLjOWPjrm0RLg0XGNnm9evFVTSevMLpKEil0kCRW7SBIqdpEkVOwiSajYRZJQsYsk8Znqs3tjr6OebDQHeZl9R+Oqo6WJoz56NG/81atX68a6u7vdbaN54aPcyoiO2+XLl0vdvzeevWyfvKxoHoBWCM/sJJ8nOUHy5LzbniE5SvJE8W93a9MUkbIW8zL+JwAeW+D2H5jZjuLfK81NS0SaLSx2M3sNgH/toIh0vDIf0H2T5BvFy/x19X6J5CDJoySPltiXiJTUaLH/CMDnAOwAUAPwvXq/aGZDZrbTzHY2uC8RaYKGit3Mxs3supndAPBjALuam5aINFtDxU6yb96PXwZwst7vikhnCPvsJF8A8CiA9SRHAHwXwKMkdwAwAGcAfL0ZyUS9Ta+X7vVUgbifHPXCvZ5w1C+enZ1145FoLfD+/v66sZGRkVL7Xr16tRuP+vje3x7NERDdd8S7NiIaCx+NtS8b957rrerBh8VuZnsXuPlAC3IRkRbS5bIiSajYRZJQsYskoWIXSULFLpLEZ2qIq9eu8IZ5AnELKZpSuaurq+FtoyWZo9ZclLu3PHDUUoxaUB988IEbP3v2rBvfvn173Vg0DXV0XKLcve2j1ljU/irbHvOG2JZpQXt0ZhdJQsUukoSKXSQJFbtIEip2kSRU7CJJqNhFkuioPnu07LLXV436pl4vGvCHQwJ+zzbquUb3HeUeDXH1lh++cuWKu+3MzIwbj6axjnq+Zaa5Pn78uBuPrm/whjVHPfpGe9k3RcN3vedM2X3XozO7SBIqdpEkVOwiSajYRZJQsYskoWIXSULFLpJER/XZo96nJ1qCN7rvqC/qLV183333uduOjo668aiXHV0j4C1tHC25HI2Vj6aijpZVHh8frxuLevzR3x1t7z0noudDFI+eb9H8Ct6YdfXZRaQUFbtIEip2kSRU7CJJqNhFklCxiyShYhdJoqP67GXmyy4713a0pLM31j7qB2/YsMGNR2POJyYm3PiaNWsaigHA+fPn3Xj0t0X96Onp6bqx6DHzxukvhtfrjvrgZa75AOI5DMrefyPCMzvJAZK/ITlM8i2S3ypu7yF5mOS7xdd1rU9XRBq1mJfx1wB8x8z+FMBfAPgGyQcBPA3giJndD+BI8bOIdKiw2M2sZmbHi++nAQwD2AxgD4CDxa8dBPB4q5IUkfJu6z07yS0APg/gdwB6zawGzP2HQHJjnW0GAQyWS1NEylp0sZNcCeCXAL5tZlPRhys3mdkQgKHiPlpzhb+IhBbVeiO5FHOF/jMz+1Vx8zjJviLeB8D/yFhEKhWe2Tl3Cj8AYNjMvj8vdAjAPgDPFl9fLptMmaF90bbRdM/RdM6eaKhlNBV0NCVyNIzUyz0a4hq1oKLcomWXvccluu9arebGo7ag104tO4y07PPJi5ddDrqexbyMfwTA1wC8SfJEcdt+zBX5L0g+BeD3AL7SkgxFpCnCYjez3wKo9wb9C81NR0RaRZfLiiShYhdJQsUukoSKXSQJFbtIEh01xLWVouWgI14/OhrOGA2fXbFihRuPpi32esabNm1yt42msY6mmo6G0HrHfdmyZe620d8d5e5tHz1m0dTiZaeajuKtoDO7SBIqdpEkVOwiSajYRZJQsYskoWIXSULFLpJER/XZq5xKOuJNaxz1ZKPxydH2s7OzbtzrZUdj7aPjFvWjx8bG3Hh/f3/dWNQnjx6zaApubxrraBx/9JhFxyV6zKoYz64zu0gSKnaRJFTsIkmo2EWSULGLJKFiF0lCxS6SREf12cv2wj1RPznqdXt92Wj+8i1btrjxaLx7NAe5t/9o3PS6df7iu9E8AN3d3W7cW6763Llz7rbRfPllco/m0/d69EA8nn358uVuPFpLoBV0ZhdJQsUukoSKXSQJFbtIEip2kSRU7CJJqNhFkljM+uwDAH4KYBOAGwCGzOyHJJ8B8PcAbjZL95vZK61KNBKNLy67vTc/el9fn7tt1MNfu3atG494uUf93qifHF2f0NXV5ca9Xno053x031Gv24v39PS420bXAETXPkTj5b3j2qrrTRZTIdcAfMfMjpNcBeAYycNF7Adm9i8tyUxEmmox67PXANSK76dJDgPY3OrERKS5bus9O8ktAD4P4HfFTd8k+QbJ50kueO0iyUGSR0keLZWpiJSy6GInuRLALwF828ymAPwIwOcA7MDcmf97C21nZkNmttPMdjYhXxFp0KKKneRSzBX6z8zsVwBgZuNmdt3MbgD4MYBdrUtTRMoKi51zHxseADBsZt+fd/v8j6C/DOBk89MTkWZZzKfxjwD4GoA3SZ4obtsPYC/JHQAMwBkAX29JhosUtWGi1lo0nNKb9nhqaqrhbYE4t6j95Q31jPYdtQ0nJyfdeJTbQw89VDcWTXMdLWUdteZqtVrdWDT0N1pOOmqtRTqy9WZmvwWwUGaV9dRF5PbpCjqRJFTsIkmo2EWSULGLJKFiF0lCxS6SBFs5ffOndka2b2e3Keqreks2X7p0yd12YGDAjW/fvt2Nv/rqq278ueeeqxuLpqkeHh5246Ojo25869atbnzbtm11Y9E01ceOHXPjBw4ccOOtVGbq8VYzswWb+DqziyShYhdJQsUukoSKXSQJFbtIEip2kSRU7CJJtLvPfg7A/827aT2A821L4PZ0am6dmheg3BrVzNzuM7MF18lua7F/aufk0U6dm65Tc+vUvADl1qh25aaX8SJJqNhFkqi62Icq3r+nU3Pr1LwA5daotuRW6Xt2EWmfqs/sItImKnaRJCopdpKPkXyb5CmST1eRQz0kz5B8k+SJqtenK9bQmyB5ct5tPSQPk3y3+Fp/0vj25/YMydHi2J0gubui3AZI/obkMMm3SH6ruL3SY+fk1Zbj1vb37CSXAHgHwN8AGAHwOoC9ZvY/bU2kDpJnAOw0s8ovwCD5VwBmAPzUzB4qbvtnAJNm9mzxH+U6M/uHDsntGQAzVS/jXaxW1Dd/mXEAjwP4O1R47Jy8/hZtOG5VnNl3AThlZqfNbBbAzwHsqSCPjmdmrwG4dUmWPQAOFt8fxNyTpe3q5NYRzKxmZseL76cB3FxmvNJj5+TVFlUU+2YAZ+f9PILOWu/dAPya5DGSg1Uns4BeM6sBc08eABsrzudW4TLe7XTLMuMdc+waWf68rCqKfaH5sTqp//eImf05gC8B+EbxclUWZ1HLeLfLAsuMd4RGlz8vq4piHwEwfwbGfgBjFeSxIDMbK75OAHgJnbcU9fjNFXSLrxMV5/MHnbSM90LLjKMDjl2Vy59XUeyvA7if5FaSywB8FcChCvL4FJLdxQcnINkN4IvovKWoDwHYV3y/D8DLFebyRzplGe96y4yj4mNX+fLnZtb2fwB2Y+4T+fcA/GMVOdTJ608A/Hfx762qcwPwAuZe1l3F3CuipwDcC+AIgHeLrz0dlNt/AHgTwBuYK6y+inL7S8y9NXwDwIni3+6qj52TV1uOmy6XFUlCV9CJJKFiF0lCxS6ShIpdJAkVu0gSKnaRJFTsIkn8P4nErOlahGiIAAAAAElFTkSuQmCC\n", "text/plain": [ "
" ] }, "metadata": { "needs_background": "light" }, "output_type": "display_data" } ], "source": [ "imshow(np.asarray(samples[4]).reshape(28,28), cmap='gray')" ] }, { "cell_type": "code", "execution_count": 157, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "torch.Size([784])" ] }, "execution_count": 157, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X[0,:].shape" ] }, { "cell_type": "code", "execution_count": 156, "metadata": {}, "outputs": [ { "data": { "text/plain": [ "torch.Size([60000, 784])" ] }, "execution_count": 156, "metadata": {}, "output_type": "execute_result" } ], "source": [ "X.shape" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.7.3" } }, "nbformat": 4, "nbformat_minor": 2 }