From 6ce67fbdf6200a8f203a5893d67b2f4b3ffa84ad Mon Sep 17 00:00:00 2001 From: Steffen Schneider Date: Wed, 24 May 2023 03:15:37 +0200 Subject: [PATCH 1/2] Add notebook (incl solution) for week 11 --- week11/week11.ipynb | 3174 +++++++++++++++++++++++++++++++++++++++++++ 1 file changed, 3174 insertions(+) create mode 100644 week11/week11.ipynb diff --git a/week11/week11.ipynb b/week11/week11.ipynb new file mode 100644 index 0000000..aa4630d --- /dev/null +++ b/week11/week11.ipynb @@ -0,0 +1,3174 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "source": [ + "# Continual learning: Overcoming catastrophic forgetting with memory replay\n", + "\n", + "In this exercise class we'll implement an experiment to measure catastrophic forgetting in a neural network trained on MNIST. We will then fix/reduce the catastrophic forgetting by implementing a simple memory replay strategy." + ], + "metadata": { + "id": "lDTvzuBtNg1X" + } + }, + { + "cell_type": "markdown", + "metadata": { + "id": "Mzy1CzlGQvAk" + }, + "source": [ + "The following figure highlights the setup of the dataset and is taken from [van de Ven & Tolias, 2019](https://arxiv.org/pdf/1904.07734.pdf):\n", + "\n", + "![image.png]()" + ] + }, + { + "cell_type": "code", + "execution_count": 2, + "metadata": { + "id": "MN_GMVuyPD9D" + }, + "outputs": [], + "source": [ + "\"\"\"\n", + "Code adapted from the torchvision MNIST example:\n", + "https://github.com/pytorch/examples/blob/main/mnist/main.py\n", + "\n", + "BSD 3-Clause License\n", + "\n", + "Copyright (c) 2017, \n", + "All rights reserved.\n", + "\n", + "Redistribution and use in source and binary forms, with or without\n", + "modification, are permitted provided that the following conditions are met:\n", + "\n", + "* Redistributions of source code must retain the above copyright notice, this\n", + " list of conditions and the following disclaimer.\n", + "\n", + "* Redistributions in binary form must reproduce the above copyright notice,\n", + " this list of 
conditions and the following disclaimer in the documentation\n", + " and/or other materials provided with the distribution.\n", + "\n", + "* Neither the name of the copyright holder nor the names of its\n", + " contributors may be used to endorse or promote products derived from\n", + " this software without specific prior written permission.\n", + "\n", + "THIS SOFTWARE IS PROVIDED BY THE COPYRIGHT HOLDERS AND CONTRIBUTORS \"AS IS\"\n", + "AND ANY EXPRESS OR IMPLIED WARRANTIES, INCLUDING, BUT NOT LIMITED TO, THE\n", + "IMPLIED WARRANTIES OF MERCHANTABILITY AND FITNESS FOR A PARTICULAR PURPOSE ARE\n", + "DISCLAIMED. IN NO EVENT SHALL THE COPYRIGHT HOLDER OR CONTRIBUTORS BE LIABLE\n", + "FOR ANY DIRECT, INDIRECT, INCIDENTAL, SPECIAL, EXEMPLARY, OR CONSEQUENTIAL\n", + "DAMAGES (INCLUDING, BUT NOT LIMITED TO, PROCUREMENT OF SUBSTITUTE GOODS OR\n", + "SERVICES; LOSS OF USE, DATA, OR PROFITS; OR BUSINESS INTERRUPTION) HOWEVER\n", + "CAUSED AND ON ANY THEORY OF LIABILITY, WHETHER IN CONTRACT, STRICT LIABILITY,\n", + "OR TORT (INCLUDING NEGLIGENCE OR OTHERWISE) ARISING IN ANY WAY OUT OF THE USE\n", + "OF THIS SOFTWARE, EVEN IF ADVISED OF THE POSSIBILITY OF SUCH DAMAGE.\n", + "\"\"\"\n", + "\n", + "import argparse\n", + "import torch\n", + "import torch.nn as nn\n", + "import torch.nn.functional as F\n", + "import torch.optim as optim\n", + "from torchvision import datasets, transforms\n", + "from torch.optim.lr_scheduler import StepLR" + ] + }, + { + "cell_type": "code", + "execution_count": 3, + "metadata": { + "id": "Bu5GtxDyPMW5" + }, + "outputs": [], + "source": [ + "# Network implementation -- bonus exercise: Modify the network architecture,\n", + "# and study the effect on the training results.\n", + "\n", + "class Net(nn.Module):\n", + "\n", + " def __init__(self):\n", + " super(Net, self).__init__()\n", + " self.conv1 = nn.Conv2d(1, 32, 3, 1)\n", + " self.conv2 = nn.Conv2d(32, 64, 3, 1)\n", + " self.dropout1 = nn.Dropout(0.25)\n", + " self.dropout2 = 
nn.Dropout(0.5)\n", + " self.fc1 = nn.Linear(9216, 128)\n", + " self.fc2 = nn.Linear(128, 10)\n", + "\n", + " def forward(self, x):\n", + " x = self.conv1(x)\n", + " x = F.relu(x)\n", + " x = self.conv2(x)\n", + " x = F.relu(x)\n", + " x = F.max_pool2d(x, 2)\n", + " x = self.dropout1(x)\n", + " x = torch.flatten(x, 1)\n", + " x = self.fc1(x)\n", + " x = F.relu(x)\n", + " x = self.dropout2(x)\n", + " x = self.fc2(x)\n", + " output = F.log_softmax(x, dim=1)\n", + " return output" + ] + }, + { + "cell_type": "code", + "execution_count": 6, + "metadata": { + "id": "FljvS0QcPPTg" + }, + "outputs": [], + "source": [ + "# Exercise: Adapt the following function and store part of the images\n", + "# presented during training in a replay buffer. Replay these images\n", + "# during the training step.\n", + "\n", + "def train(args, model, device, train_loader, optimizer, epoch, buffer = None):\n", + " model.train()\n", + "\n", + " for batch_idx, (data, target) in enumerate(train_loader):\n", + "\n", + " ### START SOLUTION ###\n", + " # We append images and labels from the first training batch\n", + " # to our buffer. 
You can extend this strategy based on how\n", + " # many images you choose to store in the buffer.\n", + " if buffer is not None and batch_idx == 0:\n", + " if buffer is not None:\n", + " images, targets = next(iter(train_loader))\n", + " buffer.add(images, targets)\n", + " ### END SOLUTION ###\n", + "\n", + "\n", + " data, target = data.to(device), target.to(device)\n", + "\n", + " optimizer.zero_grad()\n", + " output = model(data)\n", + " loss = F.nll_loss(output, target)\n", + " loss.backward()\n", + " optimizer.step()\n", + "\n", + " ### START SOLUTION ###\n", + " # A simple strategy for overcoming forgetting is to retrieve images\n", + " # from the buffer (here: one image per class) and perform a gradient\n", + " # step on these images along with every incoming new batch.\n", + " if buffer is not None and len(buffer) > 0:\n", + " replayed_images, replayed_targets = buffer.get()\n", + " replayed_images = replayed_images.to(device)\n", + " replayed_targets = replayed_targets.to(device)\n", + " optimizer.zero_grad()\n", + " output = model(replayed_images)\n", + " loss = F.nll_loss(output, replayed_targets)\n", + " loss.backward()\n", + " optimizer.step()\n", + " ### END SOLUTION ###\n", + "\n", + " if batch_idx % args.log_interval == 0:\n", + " print('Train Epoch: {} [{}/{} ({:.0f}%)]\\tLoss: {:.6f}'.format(\n", + " epoch, batch_idx * len(data), len(train_loader.dataset),\n", + " 100. * batch_idx / len(train_loader), loss.item()))\n", + " if args.dry_run:\n", + " break" + ] + }, + { + "cell_type": "code", + "execution_count": 7, + "metadata": { + "id": "QXPgWNCRPRd4" + }, + "outputs": [], + "source": [ + "# The test routine was adapted from the original implementation and now computes\n", + "# the classification accuracy per class instead of an average. This allows us to\n", + "# later assess the effect of catastrophic forgetting. 
No adaptations in this function\n", + "# are required for the exercise.\n", + "\n", + "import collections\n", + "\n", + "def test(model, device, test_loader):\n", + " model.eval()\n", + " test_loss = 0\n", + " correct_by_class = collections.Counter()\n", + " count_by_class = collections.Counter()\n", + " with torch.no_grad():\n", + " for data, target in test_loader:\n", + " data, target = data.to(device), target.to(device)\n", + " output = model(data)\n", + " test_loss += F.nll_loss(output, target, reduction='sum').item() # sum up batch loss\n", + " pred = output.argmax(dim=1, keepdim=True) # get the index of the max log-probability\n", + " correct = pred.eq(target.view_as(pred)).float()\n", + " for class_ in range(10):\n", + " idc = (target == class_)\n", + " correct_by_class[class_] += correct[idc].sum().item()\n", + " count_by_class[class_] += idc.sum().item()\n", + "\n", + " test_loss /= len(test_loader.dataset)\n", + " test_acc = correct / len(test_loader.dataset)\n", + "\n", + " print(f'\\nTest set: Average loss: {test_loss:.4f}')\n", + " result = {}\n", + " for class_ in range(10):\n", + " acc = correct_by_class[class_] / count_by_class[class_]\n", + " result[class_] = acc\n", + " print(\n", + " f\"Class {class_} accuracy: \"\n", + " f\"{correct_by_class[class_]}/{count_by_class[class_]}\"\n", + " f\"({acc*100:.0f}%)\"\n", + " )\n", + "\n", + " return result" + ] + }, + { + "cell_type": "code", + "execution_count": 9, + "metadata": { + "id": "UsdJlkLkRRbp" + }, + "outputs": [], + "source": [ + "# Exercise: Adapt the dataset class \"MNISTContinualLearning\" for the experiment\n", + "# outlined in the introduction text. 
The class needs to support indexing of the\n", + "# dataset based on the provided list of classes.\n", + "\n", + "def identity(x):\n", + " return\n", + "\n", + "class MNISTContinualLearning(datasets.MNIST):\n", + "\n", + " def __init__(self, *args, classes=list(range(10)), **kwargs):\n", + "\n", + " # This inherits from the base dataset\n", + " super().__init__(*args, **kwargs)\n", + "\n", + " if len(classes) < 2:\n", + " raise ValueError(f\"Need at least two classes, but got {len(classes)}\")\n", + "\n", + " # Add code for filtering the dataset here. You need to adapt\n", + " # the \"data\" and \"targets\" attributes of the dataset. The \"data\"\n", + " # attribute stores the images as a torch tensor, while the \"targets\"\n", + " # attribute stores the labels as a torch tensor.\n", + " # You can override the existing attributes.\n", + " #\n", + " # self.data = ...\n", + " # self.targets = ...\n", + " \n", + " ### START SOLUTION ###\n", + " idc = None\n", + " for class_ in classes:\n", + " if idc is None:\n", + " idc = self.targets == class_\n", + " idc |= self.targets == class_\n", + "\n", + " self.data = self.data[idc]\n", + " self.targets = self.targets[idc]\n", + " ### END SOLUTION ###\n", + "\n", + "\n", + "def test_dataset():\n", + " transform=transforms.Compose([\n", + " transforms.ToTensor(),\n", + " transforms.Normalize((0.1307,), (0.3081,))\n", + " ])\n", + " dataset1 = MNISTContinualLearning('../data', train=True, download=True, transform=transform, classes = [0, 5])\n", + " assert len(dataset1) == 11344\n", + "\n", + "test_dataset()" + ] + }, + { + "cell_type": "code", + "execution_count": 10, + "metadata": { + "id": "EDwtthksNUpw" + }, + "outputs": [], + "source": [ + "# To implement memory replay, add additional code (functions or classes)\n", + "# to this cell. 
One possible solution is to implement a \"Buffer\" class\n", + "# that allows adding images to memory, and allows retrieving the stored\n", + "# images and labels for training the model.\n", + "#\n", + "# The buffer is typically memory constrained, and there are multiple ways\n", + "# to efficiently compress the individual elements present in the buffer.\n", + "# Think about different ways of reducing the storage required by your buffer\n", + "# class, and explore which of them is most effective at mitigating catastrophic\n", + "# forgetting.\n", + "\n", + "\n", + "### START SOLUTION ###\n", + "\n", + "class Buffer(nn.Module):\n", + "\n", + " def __init__(self):\n", + " self.buffer = {}\n", + " \n", + " def add(self, images, targets):\n", + " for class_ in targets.unique():\n", + " idc = targets == class_\n", + " self.buffer[class_] = images[idc][0]\n", + "\n", + " def get(self):\n", + " assert len(self) > 0\n", + " keys = list(self.buffer.keys())\n", + " targets = torch.tensor(keys)\n", + " images = torch.stack([self.buffer[k] for k in keys], dim = 0)\n", + " assert len(targets) == len(images)\n", + " return images, targets\n", + "\n", + " def __len__(self):\n", + " return sum(len(v) if v is not None else 0 for v in self.buffer.values())\n", + " \n", + "### END SOLUTION ###" + ] + }, + { + "cell_type": "code", + "execution_count": 12, + "metadata": { + "id": "u2xvlBoZPTyx" + }, + "outputs": [], + "source": [ + "# Adapt the main training loop to work with the functions you defined above.\n", + "\n", + "def train_model(args, model, phase, replay_buffer = [], history = [], buffer = None):\n", + " use_cuda = not args.no_cuda and torch.cuda.is_available()\n", + " device = torch.device(\"cuda\" if use_cuda else \"cpu\")\n", + "\n", + " torch.manual_seed(args.seed)\n", + "\n", + " train_kwargs = {'batch_size': args.batch_size}\n", + " test_kwargs = {'batch_size': args.test_batch_size}\n", + " if use_cuda:\n", + " cuda_kwargs = {'num_workers': 1,\n", + " 'pin_memory': 
True,\n", + " 'shuffle': True}\n", + " train_kwargs.update(cuda_kwargs)\n", + " test_kwargs.update(cuda_kwargs)\n", + "\n", + " transform=transforms.Compose([\n", + " transforms.ToTensor(),\n", + " transforms.Normalize((0.1307,), (0.3081,))\n", + " ])\n", + " \n", + " # You need to replace the original MNIST dataset here by the continual\n", + " # learning dataset we implemented in the previous cell. Make sure to\n", + " # pass the list of classes selected for training in args.train_classes.\n", + " \n", + " ### START SOLUTION ###\n", + " # We added the revised MNIST class here, which takes the same arguments\n", + " # as the original class, but additionally takes a \"classes\" argument which\n", + " # specifies the subselection of classes to consider during this training\n", + " # phase.\n", + " dataset1 = MNISTContinualLearning('../data', train=True, download=True,\n", + " transform=transform, classes=args.train_classes)\n", + " ### END SOLUTION ###\n", + " dataset2 = datasets.MNIST('../data', train=False, download=True,\n", + " transform=transform)\n", + " train_loader = torch.utils.data.DataLoader(dataset1,**train_kwargs)\n", + " test_loader = torch.utils.data.DataLoader(dataset2, **test_kwargs)\n", + "\n", + " model = model.to(device)\n", + " optimizer = optim.Adadelta(model.parameters(), lr=args.lr)\n", + " scheduler = StepLR(optimizer, step_size=1, gamma=args.gamma)\n", + "\n", + " for epoch in range(1, args.epochs + 1):\n", + " ### START SOLUTION ###\n", + " # We additionally pass the \"buffer\" class here to collect training\n", + " # images for later memory replay.\n", + " # \n", + " # Original content:\n", + " # train(args, model, device, train_loader, optimizer, epoch)\n", + " train(args, model, device, train_loader, optimizer, epoch, buffer)\n", + " ### END SOLUTION ###\n", + " test_results = test(model, device, test_loader)\n", + " test_results[\"phase\"] = phase\n", + " history.append(test_results)\n", + " scheduler.step()\n", + "\n", + " return 
history\n" + ] + }, + { + "cell_type": "code", + "source": [ + "# We now define the experiment setup.\n", + "# Without modifications to the code, the following will simply train an MNIST\n", + "# network multiple times, and reach an accuracy of >99% on the test set.\n", + "#\n", + "# The result will be modified in two steps:\n", + "#\n", + "# -- first, after implementing the MNISTContinualLearning dataset, you will be\n", + "# able to observe catastrophic forgetting: Training on a new task (specified\n", + "# by the \"phase\" and \"config.train_classes\" variables) will make the network\n", + "# forget the previously learned tasks, and you will observe a performance drop.\n", + "#\n", + "# -- second, after implementing the catastrophic forgetting experiment, you will\n", + "# fix the catastrophic forgetting by implementing a simple memory buffer. This\n", + "# buffer will keep some of the images seen in each individual training phase,\n", + "# and add them to the training in each subsequent phase. This task is open-ended\n", + "# and different strategies exist. 
They will differ in terms of memory efficiency\n", + "# and performance.\n", + "\n", + "# You should adapt the train config to each experiment setup and especially test the\n", + "# effects of taking different values for the number of epochs (per phase of the training)\n", + "# and the learning rate used.\n", + "config = argparse.Namespace(\n", + " batch_size=64, \n", + " test_batch_size=1000, \n", + " epochs=5, \n", + " lr=0.001,\n", + " gamma=0.7,\n", + " no_cuda=False,\n", + " dry_run=False,\n", + " seed=1,\n", + " log_interval=10,\n", + " save_model=False\n", + ")\n", + "\n", + "def train_regular_mnist():\n", + " model = Net()\n", + " history = []\n", + "\n", + " config.train_classes = [0, 1, 2, 3, 4, 5, 6, 7, 8, 9]\n", + " train_model(config, model, phase = \"baseline\", history = history)\n", + " return history\n", + "\n", + "history_regular_mnist = train_regular_mnist()\n", + "history_regular_mnist" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "SK-GNifLPN2S", + "outputId": "9cd9a6a2-9b54-46c8-a072-fcd66b995364" + }, + "execution_count": 14, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Train Epoch: 1 [0/60000 (0%)]\tLoss: 2.295775\n", + "Train Epoch: 1 [640/60000 (1%)]\tLoss: 2.290210\n", + "Train Epoch: 1 [1280/60000 (2%)]\tLoss: 2.310344\n", + "Train Epoch: 1 [1920/60000 (3%)]\tLoss: 2.292868\n", + "Train Epoch: 1 [2560/60000 (4%)]\tLoss: 2.290216\n", + "Train Epoch: 1 [3200/60000 (5%)]\tLoss: 2.276424\n", + "Train Epoch: 1 [3840/60000 (6%)]\tLoss: 2.281419\n", + "Train Epoch: 1 [4480/60000 (7%)]\tLoss: 2.276124\n", + "Train Epoch: 1 [5120/60000 (9%)]\tLoss: 2.267236\n", + "Train Epoch: 1 [5760/60000 (10%)]\tLoss: 2.294219\n", + "Train Epoch: 1 [6400/60000 (11%)]\tLoss: 2.254271\n", + "Train Epoch: 1 [7040/60000 (12%)]\tLoss: 2.264095\n", + "Train Epoch: 1 [7680/60000 (13%)]\tLoss: 2.256358\n", + "Train Epoch: 1 [8320/60000 (14%)]\tLoss: 2.274228\n", + "Train Epoch: 1 [8960/60000 
(15%)]\tLoss: 2.269273\n", + "Train Epoch: 1 [9600/60000 (16%)]\tLoss: 2.240185\n", + "Train Epoch: 1 [10240/60000 (17%)]\tLoss: 2.248815\n", + "Train Epoch: 1 [10880/60000 (18%)]\tLoss: 2.223281\n", + "Train Epoch: 1 [11520/60000 (19%)]\tLoss: 2.222255\n", + "Train Epoch: 1 [12160/60000 (20%)]\tLoss: 2.233015\n", + "Train Epoch: 1 [12800/60000 (21%)]\tLoss: 2.211506\n", + "Train Epoch: 1 [13440/60000 (22%)]\tLoss: 2.234103\n", + "Train Epoch: 1 [14080/60000 (23%)]\tLoss: 2.225921\n", + "Train Epoch: 1 [14720/60000 (25%)]\tLoss: 2.202645\n", + "Train Epoch: 1 [15360/60000 (26%)]\tLoss: 2.196408\n", + "Train Epoch: 1 [16000/60000 (27%)]\tLoss: 2.202403\n", + "Train Epoch: 1 [16640/60000 (28%)]\tLoss: 2.209469\n", + "Train Epoch: 1 [17280/60000 (29%)]\tLoss: 2.180980\n", + "Train Epoch: 1 [17920/60000 (30%)]\tLoss: 2.153812\n", + "Train Epoch: 1 [18560/60000 (31%)]\tLoss: 2.150105\n", + "Train Epoch: 1 [19200/60000 (32%)]\tLoss: 2.158034\n", + "Train Epoch: 1 [19840/60000 (33%)]\tLoss: 2.172502\n", + "Train Epoch: 1 [20480/60000 (34%)]\tLoss: 2.093013\n", + "Train Epoch: 1 [21120/60000 (35%)]\tLoss: 2.130392\n", + "Train Epoch: 1 [21760/60000 (36%)]\tLoss: 2.172241\n", + "Train Epoch: 1 [22400/60000 (37%)]\tLoss: 2.162427\n", + "Train Epoch: 1 [23040/60000 (38%)]\tLoss: 2.168904\n", + "Train Epoch: 1 [23680/60000 (39%)]\tLoss: 2.179659\n", + "Train Epoch: 1 [24320/60000 (41%)]\tLoss: 2.163229\n", + "Train Epoch: 1 [24960/60000 (42%)]\tLoss: 2.126366\n", + "Train Epoch: 1 [25600/60000 (43%)]\tLoss: 2.138455\n", + "Train Epoch: 1 [26240/60000 (44%)]\tLoss: 2.113500\n", + "Train Epoch: 1 [26880/60000 (45%)]\tLoss: 2.067201\n", + "Train Epoch: 1 [27520/60000 (46%)]\tLoss: 2.114285\n", + "Train Epoch: 1 [28160/60000 (47%)]\tLoss: 2.036888\n", + "Train Epoch: 1 [28800/60000 (48%)]\tLoss: 2.068524\n", + "Train Epoch: 1 [29440/60000 (49%)]\tLoss: 2.097640\n", + "Train Epoch: 1 [30080/60000 (50%)]\tLoss: 2.028418\n", + "Train Epoch: 1 [30720/60000 (51%)]\tLoss: 2.031548\n", + 
"Train Epoch: 1 [31360/60000 (52%)]\tLoss: 2.051078\n", + "Train Epoch: 1 [32000/60000 (53%)]\tLoss: 2.028303\n", + "Train Epoch: 1 [32640/60000 (54%)]\tLoss: 1.983975\n", + "Train Epoch: 1 [33280/60000 (55%)]\tLoss: 2.043919\n", + "Train Epoch: 1 [33920/60000 (57%)]\tLoss: 1.980050\n", + "Train Epoch: 1 [34560/60000 (58%)]\tLoss: 1.970208\n", + "Train Epoch: 1 [35200/60000 (59%)]\tLoss: 2.048699\n", + "Train Epoch: 1 [35840/60000 (60%)]\tLoss: 1.956716\n", + "Train Epoch: 1 [36480/60000 (61%)]\tLoss: 1.987072\n", + "Train Epoch: 1 [37120/60000 (62%)]\tLoss: 1.984343\n", + "Train Epoch: 1 [37760/60000 (63%)]\tLoss: 1.947972\n", + "Train Epoch: 1 [38400/60000 (64%)]\tLoss: 1.938421\n", + "Train Epoch: 1 [39040/60000 (65%)]\tLoss: 1.919820\n", + "Train Epoch: 1 [39680/60000 (66%)]\tLoss: 1.931831\n", + "Train Epoch: 1 [40320/60000 (67%)]\tLoss: 1.953799\n", + "Train Epoch: 1 [40960/60000 (68%)]\tLoss: 1.883609\n", + "Train Epoch: 1 [41600/60000 (69%)]\tLoss: 1.876115\n", + "Train Epoch: 1 [42240/60000 (70%)]\tLoss: 1.870510\n", + "Train Epoch: 1 [42880/60000 (71%)]\tLoss: 1.910781\n", + "Train Epoch: 1 [43520/60000 (72%)]\tLoss: 1.950781\n", + "Train Epoch: 1 [44160/60000 (74%)]\tLoss: 1.985367\n", + "Train Epoch: 1 [44800/60000 (75%)]\tLoss: 1.823831\n", + "Train Epoch: 1 [45440/60000 (76%)]\tLoss: 1.870280\n", + "Train Epoch: 1 [46080/60000 (77%)]\tLoss: 1.794647\n", + "Train Epoch: 1 [46720/60000 (78%)]\tLoss: 1.864569\n", + "Train Epoch: 1 [47360/60000 (79%)]\tLoss: 1.871643\n", + "Train Epoch: 1 [48000/60000 (80%)]\tLoss: 1.794408\n", + "Train Epoch: 1 [48640/60000 (81%)]\tLoss: 1.836012\n", + "Train Epoch: 1 [49280/60000 (82%)]\tLoss: 1.784632\n", + "Train Epoch: 1 [49920/60000 (83%)]\tLoss: 1.775053\n", + "Train Epoch: 1 [50560/60000 (84%)]\tLoss: 1.691660\n", + "Train Epoch: 1 [51200/60000 (85%)]\tLoss: 1.818502\n", + "Train Epoch: 1 [51840/60000 (86%)]\tLoss: 1.792987\n", + "Train Epoch: 1 [52480/60000 (87%)]\tLoss: 1.763221\n", + "Train Epoch: 1 
[53120/60000 (88%)]\tLoss: 1.779346\n", + "Train Epoch: 1 [53760/60000 (90%)]\tLoss: 1.678108\n", + "Train Epoch: 1 [54400/60000 (91%)]\tLoss: 1.780516\n", + "Train Epoch: 1 [55040/60000 (92%)]\tLoss: 1.650490\n", + "Train Epoch: 1 [55680/60000 (93%)]\tLoss: 1.704799\n", + "Train Epoch: 1 [56320/60000 (94%)]\tLoss: 1.720001\n", + "Train Epoch: 1 [56960/60000 (95%)]\tLoss: 1.716193\n", + "Train Epoch: 1 [57600/60000 (96%)]\tLoss: 1.665386\n", + "Train Epoch: 1 [58240/60000 (97%)]\tLoss: 1.669093\n", + "Train Epoch: 1 [58880/60000 (98%)]\tLoss: 1.669740\n", + "Train Epoch: 1 [59520/60000 (99%)]\tLoss: 1.576309\n", + "\n", + "Test set: Average loss: 1.5640\n", + "Class 0 accuracy: 942.0/980(96%)\n", + "Class 1 accuracy: 1049.0/1135(92%)\n", + "Class 2 accuracy: 530.0/1032(51%)\n", + "Class 3 accuracy: 928.0/1010(92%)\n", + "Class 4 accuracy: 747.0/982(76%)\n", + "Class 5 accuracy: 299.0/892(34%)\n", + "Class 6 accuracy: 880.0/958(92%)\n", + "Class 7 accuracy: 851.0/1028(83%)\n", + "Class 8 accuracy: 744.0/974(76%)\n", + "Class 9 accuracy: 788.0/1009(78%)\n", + "Train Epoch: 2 [0/60000 (0%)]\tLoss: 1.627061\n", + "Train Epoch: 2 [640/60000 (1%)]\tLoss: 1.545597\n", + "Train Epoch: 2 [1280/60000 (2%)]\tLoss: 1.698457\n", + "Train Epoch: 2 [1920/60000 (3%)]\tLoss: 1.572205\n", + "Train Epoch: 2 [2560/60000 (4%)]\tLoss: 1.636262\n", + "Train Epoch: 2 [3200/60000 (5%)]\tLoss: 1.641547\n", + "Train Epoch: 2 [3840/60000 (6%)]\tLoss: 1.528854\n", + "Train Epoch: 2 [4480/60000 (7%)]\tLoss: 1.606497\n", + "Train Epoch: 2 [5120/60000 (9%)]\tLoss: 1.548691\n", + "Train Epoch: 2 [5760/60000 (10%)]\tLoss: 1.562155\n", + "Train Epoch: 2 [6400/60000 (11%)]\tLoss: 1.498272\n", + "Train Epoch: 2 [7040/60000 (12%)]\tLoss: 1.519710\n", + "Train Epoch: 2 [7680/60000 (13%)]\tLoss: 1.605046\n", + "Train Epoch: 2 [8320/60000 (14%)]\tLoss: 1.567077\n", + "Train Epoch: 2 [8960/60000 (15%)]\tLoss: 1.434826\n", + "Train Epoch: 2 [9600/60000 (16%)]\tLoss: 1.478333\n", + "Train Epoch: 2 
[10240/60000 (17%)]\tLoss: 1.479111\n", + "Train Epoch: 2 [10880/60000 (18%)]\tLoss: 1.503707\n", + "Train Epoch: 2 [11520/60000 (19%)]\tLoss: 1.373165\n", + "Train Epoch: 2 [12160/60000 (20%)]\tLoss: 1.460236\n", + "Train Epoch: 2 [12800/60000 (21%)]\tLoss: 1.565628\n", + "Train Epoch: 2 [13440/60000 (22%)]\tLoss: 1.565041\n", + "Train Epoch: 2 [14080/60000 (23%)]\tLoss: 1.426577\n", + "Train Epoch: 2 [14720/60000 (25%)]\tLoss: 1.531582\n", + "Train Epoch: 2 [15360/60000 (26%)]\tLoss: 1.427804\n", + "Train Epoch: 2 [16000/60000 (27%)]\tLoss: 1.453471\n", + "Train Epoch: 2 [16640/60000 (28%)]\tLoss: 1.528445\n", + "Train Epoch: 2 [17280/60000 (29%)]\tLoss: 1.515689\n", + "Train Epoch: 2 [17920/60000 (30%)]\tLoss: 1.517196\n", + "Train Epoch: 2 [18560/60000 (31%)]\tLoss: 1.446620\n", + "Train Epoch: 2 [19200/60000 (32%)]\tLoss: 1.496210\n", + "Train Epoch: 2 [19840/60000 (33%)]\tLoss: 1.423505\n", + "Train Epoch: 2 [20480/60000 (34%)]\tLoss: 1.415124\n", + "Train Epoch: 2 [21120/60000 (35%)]\tLoss: 1.544892\n", + "Train Epoch: 2 [21760/60000 (36%)]\tLoss: 1.340283\n", + "Train Epoch: 2 [22400/60000 (37%)]\tLoss: 1.363816\n", + "Train Epoch: 2 [23040/60000 (38%)]\tLoss: 1.382646\n", + "Train Epoch: 2 [23680/60000 (39%)]\tLoss: 1.264206\n", + "Train Epoch: 2 [24320/60000 (41%)]\tLoss: 1.332618\n", + "Train Epoch: 2 [24960/60000 (42%)]\tLoss: 1.358470\n", + "Train Epoch: 2 [25600/60000 (43%)]\tLoss: 1.344868\n", + "Train Epoch: 2 [26240/60000 (44%)]\tLoss: 1.327641\n", + "Train Epoch: 2 [26880/60000 (45%)]\tLoss: 1.382141\n", + "Train Epoch: 2 [27520/60000 (46%)]\tLoss: 1.403416\n", + "Train Epoch: 2 [28160/60000 (47%)]\tLoss: 1.420001\n", + "Train Epoch: 2 [28800/60000 (48%)]\tLoss: 1.414284\n", + "Train Epoch: 2 [29440/60000 (49%)]\tLoss: 1.367697\n", + "Train Epoch: 2 [30080/60000 (50%)]\tLoss: 1.498880\n", + "Train Epoch: 2 [30720/60000 (51%)]\tLoss: 1.278797\n", + "Train Epoch: 2 [31360/60000 (52%)]\tLoss: 1.333852\n", + "Train Epoch: 2 [32000/60000 (53%)]\tLoss: 
1.370776\n", + "Train Epoch: 2 [32640/60000 (54%)]\tLoss: 1.062860\n", + "Train Epoch: 2 [33280/60000 (55%)]\tLoss: 1.245440\n", + "Train Epoch: 2 [33920/60000 (57%)]\tLoss: 1.152776\n", + "Train Epoch: 2 [34560/60000 (58%)]\tLoss: 1.344226\n", + "Train Epoch: 2 [35200/60000 (59%)]\tLoss: 1.242468\n", + "Train Epoch: 2 [35840/60000 (60%)]\tLoss: 1.353402\n", + "Train Epoch: 2 [36480/60000 (61%)]\tLoss: 1.166169\n", + "Train Epoch: 2 [37120/60000 (62%)]\tLoss: 1.165925\n", + "Train Epoch: 2 [37760/60000 (63%)]\tLoss: 1.237298\n", + "Train Epoch: 2 [38400/60000 (64%)]\tLoss: 1.209161\n", + "Train Epoch: 2 [39040/60000 (65%)]\tLoss: 1.284919\n", + "Train Epoch: 2 [39680/60000 (66%)]\tLoss: 1.301399\n", + "Train Epoch: 2 [40320/60000 (67%)]\tLoss: 1.257363\n", + "Train Epoch: 2 [40960/60000 (68%)]\tLoss: 1.199494\n", + "Train Epoch: 2 [41600/60000 (69%)]\tLoss: 1.113902\n", + "Train Epoch: 2 [42240/60000 (70%)]\tLoss: 1.155495\n", + "Train Epoch: 2 [42880/60000 (71%)]\tLoss: 1.227993\n", + "Train Epoch: 2 [43520/60000 (72%)]\tLoss: 1.231888\n", + "Train Epoch: 2 [44160/60000 (74%)]\tLoss: 1.373095\n", + "Train Epoch: 2 [44800/60000 (75%)]\tLoss: 1.248195\n", + "Train Epoch: 2 [45440/60000 (76%)]\tLoss: 1.127467\n", + "Train Epoch: 2 [46080/60000 (77%)]\tLoss: 1.045080\n", + "Train Epoch: 2 [46720/60000 (78%)]\tLoss: 1.206602\n", + "Train Epoch: 2 [47360/60000 (79%)]\tLoss: 1.128123\n", + "Train Epoch: 2 [48000/60000 (80%)]\tLoss: 1.348677\n", + "Train Epoch: 2 [48640/60000 (81%)]\tLoss: 1.197632\n", + "Train Epoch: 2 [49280/60000 (82%)]\tLoss: 1.165728\n", + "Train Epoch: 2 [49920/60000 (83%)]\tLoss: 1.209910\n", + "Train Epoch: 2 [50560/60000 (84%)]\tLoss: 1.137662\n", + "Train Epoch: 2 [51200/60000 (85%)]\tLoss: 1.109170\n", + "Train Epoch: 2 [51840/60000 (86%)]\tLoss: 1.038135\n", + "Train Epoch: 2 [52480/60000 (87%)]\tLoss: 1.092770\n", + "Train Epoch: 2 [53120/60000 (88%)]\tLoss: 1.205910\n", + "Train Epoch: 2 [53760/60000 (90%)]\tLoss: 0.988055\n", + "Train 
Epoch: 2 [54400/60000 (91%)]\tLoss: 1.205869\n", + "Train Epoch: 2 [55040/60000 (92%)]\tLoss: 1.149507\n", + "Train Epoch: 2 [55680/60000 (93%)]\tLoss: 1.059419\n", + "Train Epoch: 2 [56320/60000 (94%)]\tLoss: 1.130637\n", + "Train Epoch: 2 [56960/60000 (95%)]\tLoss: 1.067291\n", + "Train Epoch: 2 [57600/60000 (96%)]\tLoss: 1.102901\n", + "Train Epoch: 2 [58240/60000 (97%)]\tLoss: 1.082644\n", + "Train Epoch: 2 [58880/60000 (98%)]\tLoss: 1.176209\n", + "Train Epoch: 2 [59520/60000 (99%)]\tLoss: 1.100892\n", + "\n", + "Test set: Average loss: 0.9323\n", + "Class 0 accuracy: 937.0/980(96%)\n", + "Class 1 accuracy: 1083.0/1135(95%)\n", + "Class 2 accuracy: 748.0/1032(72%)\n", + "Class 3 accuracy: 923.0/1010(91%)\n", + "Class 4 accuracy: 826.0/982(84%)\n", + "Class 5 accuracy: 470.0/892(53%)\n", + "Class 6 accuracy: 886.0/958(92%)\n", + "Class 7 accuracy: 898.0/1028(87%)\n", + "Class 8 accuracy: 732.0/974(75%)\n", + "Class 9 accuracy: 844.0/1009(84%)\n", + "Train Epoch: 3 [0/60000 (0%)]\tLoss: 1.117987\n", + "Train Epoch: 3 [640/60000 (1%)]\tLoss: 1.044462\n", + "Train Epoch: 3 [1280/60000 (2%)]\tLoss: 1.027436\n", + "Train Epoch: 3 [1920/60000 (3%)]\tLoss: 1.230957\n", + "Train Epoch: 3 [2560/60000 (4%)]\tLoss: 1.004591\n", + "Train Epoch: 3 [3200/60000 (5%)]\tLoss: 1.060180\n", + "Train Epoch: 3 [3840/60000 (6%)]\tLoss: 0.902412\n", + "Train Epoch: 3 [4480/60000 (7%)]\tLoss: 0.957223\n", + "Train Epoch: 3 [5120/60000 (9%)]\tLoss: 1.091123\n", + "Train Epoch: 3 [5760/60000 (10%)]\tLoss: 1.175083\n", + "Train Epoch: 3 [6400/60000 (11%)]\tLoss: 0.969085\n", + "Train Epoch: 3 [7040/60000 (12%)]\tLoss: 1.044883\n", + "Train Epoch: 3 [7680/60000 (13%)]\tLoss: 1.010503\n", + "Train Epoch: 3 [8320/60000 (14%)]\tLoss: 1.037116\n", + "Train Epoch: 3 [8960/60000 (15%)]\tLoss: 0.968517\n", + "Train Epoch: 3 [9600/60000 (16%)]\tLoss: 1.037061\n", + "Train Epoch: 3 [10240/60000 (17%)]\tLoss: 0.992225\n", + "Train Epoch: 3 [10880/60000 (18%)]\tLoss: 1.091760\n", + "Train Epoch: 3 
[11520/60000 (19%)]\tLoss: 1.100666\n", + "Train Epoch: 3 [12160/60000 (20%)]\tLoss: 0.852405\n", + "Train Epoch: 3 [12800/60000 (21%)]\tLoss: 0.957409\n", + "Train Epoch: 3 [13440/60000 (22%)]\tLoss: 0.959758\n", + "Train Epoch: 3 [14080/60000 (23%)]\tLoss: 0.998838\n", + "Train Epoch: 3 [14720/60000 (25%)]\tLoss: 1.045380\n", + "Train Epoch: 3 [15360/60000 (26%)]\tLoss: 0.842424\n", + "Train Epoch: 3 [16000/60000 (27%)]\tLoss: 1.003876\n", + "Train Epoch: 3 [16640/60000 (28%)]\tLoss: 0.948943\n", + "Train Epoch: 3 [17280/60000 (29%)]\tLoss: 1.090439\n", + "Train Epoch: 3 [17920/60000 (30%)]\tLoss: 1.087915\n", + "Train Epoch: 3 [18560/60000 (31%)]\tLoss: 1.145274\n", + "Train Epoch: 3 [19200/60000 (32%)]\tLoss: 1.217145\n", + "Train Epoch: 3 [19840/60000 (33%)]\tLoss: 1.085176\n", + "Train Epoch: 3 [20480/60000 (34%)]\tLoss: 1.083079\n", + "Train Epoch: 3 [21120/60000 (35%)]\tLoss: 0.999794\n", + "Train Epoch: 3 [21760/60000 (36%)]\tLoss: 0.911105\n", + "Train Epoch: 3 [22400/60000 (37%)]\tLoss: 1.273139\n", + "Train Epoch: 3 [23040/60000 (38%)]\tLoss: 1.048052\n", + "Train Epoch: 3 [23680/60000 (39%)]\tLoss: 0.818689\n", + "Train Epoch: 3 [24320/60000 (41%)]\tLoss: 0.858526\n", + "Train Epoch: 3 [24960/60000 (42%)]\tLoss: 0.982630\n", + "Train Epoch: 3 [25600/60000 (43%)]\tLoss: 1.042941\n", + "Train Epoch: 3 [26240/60000 (44%)]\tLoss: 0.818404\n", + "Train Epoch: 3 [26880/60000 (45%)]\tLoss: 0.947276\n", + "Train Epoch: 3 [27520/60000 (46%)]\tLoss: 0.990826\n", + "Train Epoch: 3 [28160/60000 (47%)]\tLoss: 0.956242\n", + "Train Epoch: 3 [28800/60000 (48%)]\tLoss: 1.052988\n", + "Train Epoch: 3 [29440/60000 (49%)]\tLoss: 1.157221\n", + "Train Epoch: 3 [30080/60000 (50%)]\tLoss: 0.913521\n", + "Train Epoch: 3 [30720/60000 (51%)]\tLoss: 1.009682\n", + "Train Epoch: 3 [31360/60000 (52%)]\tLoss: 0.770679\n", + "Train Epoch: 3 [32000/60000 (53%)]\tLoss: 0.990214\n", + "Train Epoch: 3 [32640/60000 (54%)]\tLoss: 0.937079\n", + "Train Epoch: 3 [33280/60000 (55%)]\tLoss: 
0.872119\n", + "Train Epoch: 3 [33920/60000 (57%)]\tLoss: 0.840864\n", + "Train Epoch: 3 [34560/60000 (58%)]\tLoss: 1.002336\n", + "Train Epoch: 3 [35200/60000 (59%)]\tLoss: 0.915164\n", + "Train Epoch: 3 [35840/60000 (60%)]\tLoss: 1.012089\n", + "Train Epoch: 3 [36480/60000 (61%)]\tLoss: 0.939280\n", + "Train Epoch: 3 [37120/60000 (62%)]\tLoss: 1.060541\n", + "Train Epoch: 3 [37760/60000 (63%)]\tLoss: 0.937920\n", + "Train Epoch: 3 [38400/60000 (64%)]\tLoss: 1.006945\n", + "Train Epoch: 3 [39040/60000 (65%)]\tLoss: 1.078756\n", + "Train Epoch: 3 [39680/60000 (66%)]\tLoss: 1.017594\n", + "Train Epoch: 3 [40320/60000 (67%)]\tLoss: 1.033234\n", + "Train Epoch: 3 [40960/60000 (68%)]\tLoss: 1.230211\n", + "Train Epoch: 3 [41600/60000 (69%)]\tLoss: 0.684275\n", + "Train Epoch: 3 [42240/60000 (70%)]\tLoss: 1.083214\n", + "Train Epoch: 3 [42880/60000 (71%)]\tLoss: 0.852170\n", + "Train Epoch: 3 [43520/60000 (72%)]\tLoss: 0.995445\n", + "Train Epoch: 3 [44160/60000 (74%)]\tLoss: 0.790355\n", + "Train Epoch: 3 [44800/60000 (75%)]\tLoss: 0.920374\n", + "Train Epoch: 3 [45440/60000 (76%)]\tLoss: 1.090557\n", + "Train Epoch: 3 [46080/60000 (77%)]\tLoss: 0.755298\n", + "Train Epoch: 3 [46720/60000 (78%)]\tLoss: 1.101079\n", + "Train Epoch: 3 [47360/60000 (79%)]\tLoss: 0.719922\n", + "Train Epoch: 3 [48000/60000 (80%)]\tLoss: 0.805579\n", + "Train Epoch: 3 [48640/60000 (81%)]\tLoss: 0.866616\n", + "Train Epoch: 3 [49280/60000 (82%)]\tLoss: 0.777545\n", + "Train Epoch: 3 [49920/60000 (83%)]\tLoss: 0.800337\n", + "Train Epoch: 3 [50560/60000 (84%)]\tLoss: 0.921025\n", + "Train Epoch: 3 [51200/60000 (85%)]\tLoss: 0.961804\n", + "Train Epoch: 3 [51840/60000 (86%)]\tLoss: 0.882696\n", + "Train Epoch: 3 [52480/60000 (87%)]\tLoss: 0.849839\n", + "Train Epoch: 3 [53120/60000 (88%)]\tLoss: 0.893887\n", + "Train Epoch: 3 [53760/60000 (90%)]\tLoss: 0.815971\n", + "Train Epoch: 3 [54400/60000 (91%)]\tLoss: 1.109305\n", + "Train Epoch: 3 [55040/60000 (92%)]\tLoss: 0.864345\n", + "Train 
Epoch: 3 [55680/60000 (93%)]\tLoss: 0.969730\n", + "Train Epoch: 3 [56320/60000 (94%)]\tLoss: 0.959234\n", + "Train Epoch: 3 [56960/60000 (95%)]\tLoss: 0.954617\n", + "Train Epoch: 3 [57600/60000 (96%)]\tLoss: 0.790892\n", + "Train Epoch: 3 [58240/60000 (97%)]\tLoss: 1.002821\n", + "Train Epoch: 3 [58880/60000 (98%)]\tLoss: 0.799075\n", + "Train Epoch: 3 [59520/60000 (99%)]\tLoss: 0.859415\n", + "\n", + "Test set: Average loss: 0.7067\n", + "Class 0 accuracy: 942.0/980(96%)\n", + "Class 1 accuracy: 1085.0/1135(96%)\n", + "Class 2 accuracy: 815.0/1032(79%)\n", + "Class 3 accuracy: 909.0/1010(90%)\n", + "Class 4 accuracy: 844.0/982(86%)\n", + "Class 5 accuracy: 572.0/892(64%)\n", + "Class 6 accuracy: 881.0/958(92%)\n", + "Class 7 accuracy: 895.0/1028(87%)\n", + "Class 8 accuracy: 773.0/974(79%)\n", + "Class 9 accuracy: 861.0/1009(85%)\n", + "Train Epoch: 4 [0/60000 (0%)]\tLoss: 0.921860\n", + "Train Epoch: 4 [640/60000 (1%)]\tLoss: 1.006901\n", + "Train Epoch: 4 [1280/60000 (2%)]\tLoss: 0.829744\n", + "Train Epoch: 4 [1920/60000 (3%)]\tLoss: 0.958730\n", + "Train Epoch: 4 [2560/60000 (4%)]\tLoss: 0.908768\n", + "Train Epoch: 4 [3200/60000 (5%)]\tLoss: 0.809689\n", + "Train Epoch: 4 [3840/60000 (6%)]\tLoss: 0.864438\n", + "Train Epoch: 4 [4480/60000 (7%)]\tLoss: 0.871907\n", + "Train Epoch: 4 [5120/60000 (9%)]\tLoss: 0.879927\n", + "Train Epoch: 4 [5760/60000 (10%)]\tLoss: 0.958960\n", + "Train Epoch: 4 [6400/60000 (11%)]\tLoss: 0.866098\n", + "Train Epoch: 4 [7040/60000 (12%)]\tLoss: 1.041393\n", + "Train Epoch: 4 [7680/60000 (13%)]\tLoss: 0.813019\n", + "Train Epoch: 4 [8320/60000 (14%)]\tLoss: 0.767784\n", + "Train Epoch: 4 [8960/60000 (15%)]\tLoss: 0.933339\n", + "Train Epoch: 4 [9600/60000 (16%)]\tLoss: 0.821877\n", + "Train Epoch: 4 [10240/60000 (17%)]\tLoss: 0.826119\n", + "Train Epoch: 4 [10880/60000 (18%)]\tLoss: 0.772280\n", + "Train Epoch: 4 [11520/60000 (19%)]\tLoss: 0.868618\n", + "Train Epoch: 4 [12160/60000 (20%)]\tLoss: 1.034466\n", + "Train Epoch: 4 
[12800/60000 (21%)]\tLoss: 0.872086\n", + "Train Epoch: 4 [13440/60000 (22%)]\tLoss: 0.912373\n", + "Train Epoch: 4 [14080/60000 (23%)]\tLoss: 0.870299\n", + "Train Epoch: 4 [14720/60000 (25%)]\tLoss: 0.731594\n", + "Train Epoch: 4 [15360/60000 (26%)]\tLoss: 1.079396\n", + "Train Epoch: 4 [16000/60000 (27%)]\tLoss: 0.882126\n", + "Train Epoch: 4 [16640/60000 (28%)]\tLoss: 0.682331\n", + "Train Epoch: 4 [17280/60000 (29%)]\tLoss: 1.029123\n", + "Train Epoch: 4 [17920/60000 (30%)]\tLoss: 0.596465\n", + "Train Epoch: 4 [18560/60000 (31%)]\tLoss: 0.813218\n", + "Train Epoch: 4 [19200/60000 (32%)]\tLoss: 0.747696\n", + "Train Epoch: 4 [19840/60000 (33%)]\tLoss: 0.880849\n", + "Train Epoch: 4 [20480/60000 (34%)]\tLoss: 0.734443\n", + "Train Epoch: 4 [21120/60000 (35%)]\tLoss: 0.840509\n", + "Train Epoch: 4 [21760/60000 (36%)]\tLoss: 0.745489\n", + "Train Epoch: 4 [22400/60000 (37%)]\tLoss: 0.841733\n", + "Train Epoch: 4 [23040/60000 (38%)]\tLoss: 0.920951\n", + "Train Epoch: 4 [23680/60000 (39%)]\tLoss: 0.924071\n", + "Train Epoch: 4 [24320/60000 (41%)]\tLoss: 0.906279\n", + "Train Epoch: 4 [24960/60000 (42%)]\tLoss: 0.867031\n", + "Train Epoch: 4 [25600/60000 (43%)]\tLoss: 0.946203\n", + "Train Epoch: 4 [26240/60000 (44%)]\tLoss: 0.989663\n", + "Train Epoch: 4 [26880/60000 (45%)]\tLoss: 0.839466\n", + "Train Epoch: 4 [27520/60000 (46%)]\tLoss: 0.843587\n", + "Train Epoch: 4 [28160/60000 (47%)]\tLoss: 0.737129\n", + "Train Epoch: 4 [28800/60000 (48%)]\tLoss: 0.807360\n", + "Train Epoch: 4 [29440/60000 (49%)]\tLoss: 0.823521\n", + "Train Epoch: 4 [30080/60000 (50%)]\tLoss: 0.841337\n", + "Train Epoch: 4 [30720/60000 (51%)]\tLoss: 0.999043\n", + "Train Epoch: 4 [31360/60000 (52%)]\tLoss: 0.962988\n", + "Train Epoch: 4 [32000/60000 (53%)]\tLoss: 1.040999\n", + "Train Epoch: 4 [32640/60000 (54%)]\tLoss: 0.750595\n", + "Train Epoch: 4 [33280/60000 (55%)]\tLoss: 0.904500\n", + "Train Epoch: 4 [33920/60000 (57%)]\tLoss: 0.716458\n", + "Train Epoch: 4 [34560/60000 (58%)]\tLoss: 
0.917832\n", + "Train Epoch: 4 [35200/60000 (59%)]\tLoss: 0.834955\n", + "Train Epoch: 4 [35840/60000 (60%)]\tLoss: 0.833779\n", + "Train Epoch: 4 [36480/60000 (61%)]\tLoss: 0.798480\n", + "Train Epoch: 4 [37120/60000 (62%)]\tLoss: 0.718178\n", + "Train Epoch: 4 [37760/60000 (63%)]\tLoss: 0.774633\n", + "Train Epoch: 4 [38400/60000 (64%)]\tLoss: 0.640932\n", + "Train Epoch: 4 [39040/60000 (65%)]\tLoss: 0.761126\n", + "Train Epoch: 4 [39680/60000 (66%)]\tLoss: 0.567800\n", + "Train Epoch: 4 [40320/60000 (67%)]\tLoss: 0.731927\n", + "Train Epoch: 4 [40960/60000 (68%)]\tLoss: 0.972790\n", + "Train Epoch: 4 [41600/60000 (69%)]\tLoss: 0.913961\n", + "Train Epoch: 4 [42240/60000 (70%)]\tLoss: 0.630956\n", + "Train Epoch: 4 [42880/60000 (71%)]\tLoss: 0.928092\n", + "Train Epoch: 4 [43520/60000 (72%)]\tLoss: 0.749575\n", + "Train Epoch: 4 [44160/60000 (74%)]\tLoss: 0.970667\n", + "Train Epoch: 4 [44800/60000 (75%)]\tLoss: 0.804512\n", + "Train Epoch: 4 [45440/60000 (76%)]\tLoss: 0.832241\n", + "Train Epoch: 4 [46080/60000 (77%)]\tLoss: 0.851197\n", + "Train Epoch: 4 [46720/60000 (78%)]\tLoss: 0.918072\n", + "Train Epoch: 4 [47360/60000 (79%)]\tLoss: 0.886158\n", + "Train Epoch: 4 [48000/60000 (80%)]\tLoss: 0.803933\n", + "Train Epoch: 4 [48640/60000 (81%)]\tLoss: 0.711099\n", + "Train Epoch: 4 [49280/60000 (82%)]\tLoss: 0.786826\n", + "Train Epoch: 4 [49920/60000 (83%)]\tLoss: 0.834988\n", + "Train Epoch: 4 [50560/60000 (84%)]\tLoss: 0.902848\n", + "Train Epoch: 4 [51200/60000 (85%)]\tLoss: 0.838035\n", + "Train Epoch: 4 [51840/60000 (86%)]\tLoss: 0.853425\n", + "Train Epoch: 4 [52480/60000 (87%)]\tLoss: 0.843906\n", + "Train Epoch: 4 [53120/60000 (88%)]\tLoss: 0.782411\n", + "Train Epoch: 4 [53760/60000 (90%)]\tLoss: 0.752052\n", + "Train Epoch: 4 [54400/60000 (91%)]\tLoss: 0.738311\n", + "Train Epoch: 4 [55040/60000 (92%)]\tLoss: 0.929952\n", + "Train Epoch: 4 [55680/60000 (93%)]\tLoss: 0.858274\n", + "Train Epoch: 4 [56320/60000 (94%)]\tLoss: 1.006905\n", + "Train 
Epoch: 4 [56960/60000 (95%)]\tLoss: 0.824607\n", + "Train Epoch: 4 [57600/60000 (96%)]\tLoss: 0.852737\n", + "Train Epoch: 4 [58240/60000 (97%)]\tLoss: 0.789701\n", + "Train Epoch: 4 [58880/60000 (98%)]\tLoss: 0.821994\n", + "Train Epoch: 4 [59520/60000 (99%)]\tLoss: 0.840377\n", + "\n", + "Test set: Average loss: 0.6137\n", + "Class 0 accuracy: 947.0/980(97%)\n", + "Class 1 accuracy: 1097.0/1135(97%)\n", + "Class 2 accuracy: 840.0/1032(81%)\n", + "Class 3 accuracy: 912.0/1010(90%)\n", + "Class 4 accuracy: 852.0/982(87%)\n", + "Class 5 accuracy: 602.0/892(67%)\n", + "Class 6 accuracy: 879.0/958(92%)\n", + "Class 7 accuracy: 904.0/1028(88%)\n", + "Class 8 accuracy: 770.0/974(79%)\n", + "Class 9 accuracy: 866.0/1009(86%)\n", + "Train Epoch: 5 [0/60000 (0%)]\tLoss: 0.841241\n", + "Train Epoch: 5 [640/60000 (1%)]\tLoss: 0.963371\n", + "Train Epoch: 5 [1280/60000 (2%)]\tLoss: 0.714024\n", + "Train Epoch: 5 [1920/60000 (3%)]\tLoss: 0.760713\n", + "Train Epoch: 5 [2560/60000 (4%)]\tLoss: 0.709700\n", + "Train Epoch: 5 [3200/60000 (5%)]\tLoss: 0.959411\n", + "Train Epoch: 5 [3840/60000 (6%)]\tLoss: 0.823688\n", + "Train Epoch: 5 [4480/60000 (7%)]\tLoss: 0.688386\n", + "Train Epoch: 5 [5120/60000 (9%)]\tLoss: 0.836027\n", + "Train Epoch: 5 [5760/60000 (10%)]\tLoss: 0.814876\n", + "Train Epoch: 5 [6400/60000 (11%)]\tLoss: 0.915517\n", + "Train Epoch: 5 [7040/60000 (12%)]\tLoss: 0.930052\n", + "Train Epoch: 5 [7680/60000 (13%)]\tLoss: 0.713963\n", + "Train Epoch: 5 [8320/60000 (14%)]\tLoss: 0.611171\n", + "Train Epoch: 5 [8960/60000 (15%)]\tLoss: 0.753952\n", + "Train Epoch: 5 [9600/60000 (16%)]\tLoss: 0.753516\n", + "Train Epoch: 5 [10240/60000 (17%)]\tLoss: 0.638662\n", + "Train Epoch: 5 [10880/60000 (18%)]\tLoss: 0.851477\n", + "Train Epoch: 5 [11520/60000 (19%)]\tLoss: 0.748764\n", + "Train Epoch: 5 [12160/60000 (20%)]\tLoss: 0.717946\n", + "Train Epoch: 5 [12800/60000 (21%)]\tLoss: 0.648801\n", + "Train Epoch: 5 [13440/60000 (22%)]\tLoss: 0.817798\n", + "Train Epoch: 5 
[14080/60000 (23%)]\tLoss: 1.011557\n", + "Train Epoch: 5 [14720/60000 (25%)]\tLoss: 0.979450\n", + "Train Epoch: 5 [15360/60000 (26%)]\tLoss: 0.741829\n", + "Train Epoch: 5 [16000/60000 (27%)]\tLoss: 0.929305\n", + "Train Epoch: 5 [16640/60000 (28%)]\tLoss: 0.898180\n", + "Train Epoch: 5 [17280/60000 (29%)]\tLoss: 0.682718\n", + "Train Epoch: 5 [17920/60000 (30%)]\tLoss: 0.841480\n", + "Train Epoch: 5 [18560/60000 (31%)]\tLoss: 0.895796\n", + "Train Epoch: 5 [19200/60000 (32%)]\tLoss: 0.707863\n", + "Train Epoch: 5 [19840/60000 (33%)]\tLoss: 0.851275\n", + "Train Epoch: 5 [20480/60000 (34%)]\tLoss: 0.855291\n", + "Train Epoch: 5 [21120/60000 (35%)]\tLoss: 0.851695\n", + "Train Epoch: 5 [21760/60000 (36%)]\tLoss: 0.684048\n", + "Train Epoch: 5 [22400/60000 (37%)]\tLoss: 0.917995\n", + "Train Epoch: 5 [23040/60000 (38%)]\tLoss: 0.765770\n", + "Train Epoch: 5 [23680/60000 (39%)]\tLoss: 0.647655\n", + "Train Epoch: 5 [24320/60000 (41%)]\tLoss: 0.739678\n", + "Train Epoch: 5 [24960/60000 (42%)]\tLoss: 0.672344\n", + "Train Epoch: 5 [25600/60000 (43%)]\tLoss: 0.766927\n", + "Train Epoch: 5 [26240/60000 (44%)]\tLoss: 0.738036\n", + "Train Epoch: 5 [26880/60000 (45%)]\tLoss: 0.852725\n", + "Train Epoch: 5 [27520/60000 (46%)]\tLoss: 0.632756\n", + "Train Epoch: 5 [28160/60000 (47%)]\tLoss: 0.689774\n", + "Train Epoch: 5 [28800/60000 (48%)]\tLoss: 0.674076\n", + "Train Epoch: 5 [29440/60000 (49%)]\tLoss: 0.755838\n", + "Train Epoch: 5 [30080/60000 (50%)]\tLoss: 0.786167\n", + "Train Epoch: 5 [30720/60000 (51%)]\tLoss: 0.804736\n", + "Train Epoch: 5 [31360/60000 (52%)]\tLoss: 0.723398\n", + "Train Epoch: 5 [32000/60000 (53%)]\tLoss: 0.685933\n", + "Train Epoch: 5 [32640/60000 (54%)]\tLoss: 0.808149\n", + "Train Epoch: 5 [33280/60000 (55%)]\tLoss: 0.944384\n", + "Train Epoch: 5 [33920/60000 (57%)]\tLoss: 0.638669\n", + "Train Epoch: 5 [34560/60000 (58%)]\tLoss: 0.683750\n", + "Train Epoch: 5 [35200/60000 (59%)]\tLoss: 0.702595\n", + "Train Epoch: 5 [35840/60000 (60%)]\tLoss: 
0.742202\n", + "Train Epoch: 5 [36480/60000 (61%)]\tLoss: 0.761243\n", + "Train Epoch: 5 [37120/60000 (62%)]\tLoss: 0.768657\n", + "Train Epoch: 5 [37760/60000 (63%)]\tLoss: 0.824368\n", + "Train Epoch: 5 [38400/60000 (64%)]\tLoss: 0.657427\n", + "Train Epoch: 5 [39040/60000 (65%)]\tLoss: 0.724466\n", + "Train Epoch: 5 [39680/60000 (66%)]\tLoss: 0.800387\n", + "Train Epoch: 5 [40320/60000 (67%)]\tLoss: 0.812061\n", + "Train Epoch: 5 [40960/60000 (68%)]\tLoss: 0.811920\n", + "Train Epoch: 5 [41600/60000 (69%)]\tLoss: 0.888286\n", + "Train Epoch: 5 [42240/60000 (70%)]\tLoss: 0.691121\n", + "Train Epoch: 5 [42880/60000 (71%)]\tLoss: 0.749742\n", + "Train Epoch: 5 [43520/60000 (72%)]\tLoss: 0.944218\n", + "Train Epoch: 5 [44160/60000 (74%)]\tLoss: 0.698245\n", + "Train Epoch: 5 [44800/60000 (75%)]\tLoss: 0.796792\n", + "Train Epoch: 5 [45440/60000 (76%)]\tLoss: 0.653151\n", + "Train Epoch: 5 [46080/60000 (77%)]\tLoss: 0.813349\n", + "Train Epoch: 5 [46720/60000 (78%)]\tLoss: 0.600790\n", + "Train Epoch: 5 [47360/60000 (79%)]\tLoss: 0.848091\n", + "Train Epoch: 5 [48000/60000 (80%)]\tLoss: 0.636887\n", + "Train Epoch: 5 [48640/60000 (81%)]\tLoss: 0.767468\n", + "Train Epoch: 5 [49280/60000 (82%)]\tLoss: 0.713464\n", + "Train Epoch: 5 [49920/60000 (83%)]\tLoss: 0.635464\n", + "Train Epoch: 5 [50560/60000 (84%)]\tLoss: 0.722847\n", + "Train Epoch: 5 [51200/60000 (85%)]\tLoss: 0.924447\n", + "Train Epoch: 5 [51840/60000 (86%)]\tLoss: 0.738732\n", + "Train Epoch: 5 [52480/60000 (87%)]\tLoss: 0.732151\n", + "Train Epoch: 5 [53120/60000 (88%)]\tLoss: 0.769458\n", + "Train Epoch: 5 [53760/60000 (90%)]\tLoss: 0.761817\n", + "Train Epoch: 5 [54400/60000 (91%)]\tLoss: 0.766024\n", + "Train Epoch: 5 [55040/60000 (92%)]\tLoss: 0.820377\n", + "Train Epoch: 5 [55680/60000 (93%)]\tLoss: 0.713448\n", + "Train Epoch: 5 [56320/60000 (94%)]\tLoss: 0.753411\n", + "Train Epoch: 5 [56960/60000 (95%)]\tLoss: 0.758932\n", + "Train Epoch: 5 [57600/60000 (96%)]\tLoss: 0.690840\n", + "Train 
Epoch: 5 [58240/60000 (97%)]\tLoss: 0.855213\n", + "Train Epoch: 5 [58880/60000 (98%)]\tLoss: 0.847026\n", + "Train Epoch: 5 [59520/60000 (99%)]\tLoss: 0.714162\n", + "\n", + "Test set: Average loss: 0.5663\n", + "Class 0 accuracy: 949.0/980(97%)\n", + "Class 1 accuracy: 1095.0/1135(96%)\n", + "Class 2 accuracy: 841.0/1032(81%)\n", + "Class 3 accuracy: 909.0/1010(90%)\n", + "Class 4 accuracy: 861.0/982(88%)\n", + "Class 5 accuracy: 630.0/892(71%)\n", + "Class 6 accuracy: 881.0/958(92%)\n", + "Class 7 accuracy: 906.0/1028(88%)\n", + "Class 8 accuracy: 798.0/974(82%)\n", + "Class 9 accuracy: 869.0/1009(86%)\n" + ] + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "[{0: 0.9612244897959183,\n", + " 1: 0.9242290748898678,\n", + " 2: 0.5135658914728682,\n", + " 3: 0.9188118811881189,\n", + " 4: 0.7606924643584522,\n", + " 5: 0.3352017937219731,\n", + " 6: 0.918580375782881,\n", + " 7: 0.8278210116731517,\n", + " 8: 0.7638603696098563,\n", + " 9: 0.7809712586719524,\n", + " 'phase': 'baseline'},\n", + " {0: 0.9561224489795919,\n", + " 1: 0.9541850220264317,\n", + " 2: 0.7248062015503876,\n", + " 3: 0.9138613861386139,\n", + " 4: 0.8411405295315683,\n", + " 5: 0.5269058295964125,\n", + " 6: 0.9248434237995825,\n", + " 7: 0.8735408560311284,\n", + " 8: 0.7515400410677618,\n", + " 9: 0.8364717542120912,\n", + " 'phase': 'baseline'},\n", + " {0: 0.9612244897959183,\n", + " 1: 0.9559471365638766,\n", + " 2: 0.7897286821705426,\n", + " 3: 0.9,\n", + " 4: 0.8594704684317719,\n", + " 5: 0.6412556053811659,\n", + " 6: 0.9196242171189979,\n", + " 7: 0.8706225680933852,\n", + " 8: 0.7936344969199178,\n", + " 9: 0.8533201189296333,\n", + " 'phase': 'baseline'},\n", + " {0: 0.9663265306122449,\n", + " 1: 0.9665198237885463,\n", + " 2: 0.813953488372093,\n", + " 3: 0.902970297029703,\n", + " 4: 0.8676171079429735,\n", + " 5: 0.6748878923766816,\n", + " 6: 0.9175365344467641,\n", + " 7: 0.8793774319066148,\n", + " 8: 0.7905544147843943,\n", + " 9: 
0.8582755203171457,\n", + " 'phase': 'baseline'},\n", + " {0: 0.9683673469387755,\n", + " 1: 0.9647577092511013,\n", + " 2: 0.814922480620155,\n", + " 3: 0.9,\n", + " 4: 0.8767820773930753,\n", + " 5: 0.7062780269058296,\n", + " 6: 0.9196242171189979,\n", + " 7: 0.8813229571984436,\n", + " 8: 0.8193018480492813,\n", + " 9: 0.8612487611496531,\n", + " 'phase': 'baseline'}]" + ] + }, + "metadata": {}, + "execution_count": 14 + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Exercise 1: Implement an experiment setup that measures catastrophic forgetting while\n", + "# training in a task-incremental way on digits (0,1), (2,3), ..., (8, 9). After finishing\n", + "# training, measure the performance on the first task again.\n", + "#\n", + "# Implementation requires to fill in code further up in this notebook. You can visualize\n", + "# the result using the code further below.\n", + "\n", + "### START SOLUTION ###\n", + "# In this first part, we implement an experiment setup to measure catastrophic forgetting.\n", + "# We will subsequently train on pairs of classes, (0,1), then (2,3), etc., and in the end\n", + "# revisit the first task to measure if there was any forward transfer while training on the\n", + "# other tasks.\n", + "\n", + "def train_catastrophic_forgetting():\n", + " model = Net()\n", + " history = []\n", + "\n", + " config.train_classes = [0, 1]\n", + " train_model(config, model, phase = \"0_1\", history = history)\n", + " \n", + " config.train_classes = [2, 3]\n", + " train_model(config, model, phase = \"2_3\", history = history)\n", + "\n", + " config.train_classes = [4, 5]\n", + " train_model(config, model, phase = \"4_5\", history = history)\n", + "\n", + " config.train_classes = [6, 7]\n", + " train_model(config, model, phase = \"6_7\", history = history)\n", + "\n", + " config.train_classes = [8, 9]\n", + " train_model(config, model, phase = \"8_9\", history = history)\n", + " \n", + " config.train_classes = [0, 1]\n", + " 
train_model(config, model, phase = \"0_1_again\", history = history)\n", + "\n", + " return history\n", + "\n", + "### END SOLUTION ###\n", + " \n", + "history_catastrophic_forgetting = train_catastrophic_forgetting()\n", + "history_catastrophic_forgetting" + ], + "metadata": { + "colab": { + "base_uri": "https://localhost:8080/" + }, + "id": "OnATcaveP3Fi", + "outputId": "3864a59d-b604-491d-8697-f4f7d622c1e7" + }, + "execution_count": 15, + "outputs": [ + { + "output_type": "stream", + "name": "stdout", + "text": [ + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 2.311233\n", + "Train Epoch: 1 [640/12665 (5%)]\tLoss: 2.246531\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 2.186137\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 2.105181\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 2.048626\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 1.975536\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 1.913516\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 1.818088\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 1.744223\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 1.696749\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 1.615581\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 1.508412\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 1.426383\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 1.385702\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 1.271088\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 1.157527\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 1.164531\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 1.056471\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 1.015163\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.924486\n", + "\n", + "Test set: Average loss: 2.6919\n", + "Class 0 accuracy: 972.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 
0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.725303\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.845168\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.872068\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.699184\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.702631\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.649261\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.638805\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.584503\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.612078\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.522527\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.505232\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.500317\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.420275\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.444307\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.431154\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.426933\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.428767\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.397589\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.332724\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.391286\n", + "\n", + "Test set: Average loss: 3.6493\n", + "Class 0 accuracy: 970.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.367619\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.309399\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.296202\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.340773\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.293039\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.288575\n", + 
"Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.285356\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.283475\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.285720\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.245976\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.249808\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.239022\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.268774\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.223297\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.236870\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.222967\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.242883\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.208523\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.191585\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.206234\n", + "\n", + "Test set: Average loss: 4.2921\n", + "Class 0 accuracy: 971.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.222183\n", + "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.175392\n", + "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.230008\n", + "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.246189\n", + "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.224284\n", + "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.172705\n", + "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.188962\n", + "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.212664\n", + "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.197847\n", + "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.161129\n", + "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.160840\n", + "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.193788\n", + "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.150140\n", + "Train Epoch: 4 [8320/12665 
(66%)]\tLoss: 0.193050\n", + "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.173765\n", + "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.170651\n", + "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.170728\n", + "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.179045\n", + "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.156496\n", + "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.174930\n", + "\n", + "Test set: Average loss: 4.6719\n", + "Class 0 accuracy: 972.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.150109\n", + "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.133148\n", + "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.143406\n", + "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.210281\n", + "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.129901\n", + "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.140156\n", + "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.127928\n", + "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.153185\n", + "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.132688\n", + "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.174982\n", + "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.174245\n", + "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.147878\n", + "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.105936\n", + "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.139824\n", + "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.128497\n", + "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.102555\n", + "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.149713\n", + "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.204445\n", + "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.173781\n", + "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.104449\n", + "\n", + "Test set: Average loss: 4.9040\n", + "Class 0 
accuracy: 972.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/12089 (0%)]\tLoss: 7.002198\n", + "Train Epoch: 1 [640/12089 (5%)]\tLoss: 6.786501\n", + "Train Epoch: 1 [1280/12089 (11%)]\tLoss: 6.051014\n", + "Train Epoch: 1 [1920/12089 (16%)]\tLoss: 6.422165\n", + "Train Epoch: 1 [2560/12089 (21%)]\tLoss: 5.702563\n", + "Train Epoch: 1 [3200/12089 (26%)]\tLoss: 5.380751\n", + "Train Epoch: 1 [3840/12089 (32%)]\tLoss: 4.846919\n", + "Train Epoch: 1 [4480/12089 (37%)]\tLoss: 4.511275\n", + "Train Epoch: 1 [5120/12089 (42%)]\tLoss: 4.290347\n", + "Train Epoch: 1 [5760/12089 (48%)]\tLoss: 3.839983\n", + "Train Epoch: 1 [6400/12089 (53%)]\tLoss: 3.078847\n", + "Train Epoch: 1 [7040/12089 (58%)]\tLoss: 2.839584\n", + "Train Epoch: 1 [7680/12089 (63%)]\tLoss: 2.448348\n", + "Train Epoch: 1 [8320/12089 (69%)]\tLoss: 2.193519\n", + "Train Epoch: 1 [8960/12089 (74%)]\tLoss: 1.988640\n", + "Train Epoch: 1 [9600/12089 (79%)]\tLoss: 1.651685\n", + "Train Epoch: 1 [10240/12089 (85%)]\tLoss: 1.662965\n", + "Train Epoch: 1 [10880/12089 (90%)]\tLoss: 1.390365\n", + "Train Epoch: 1 [11520/12089 (95%)]\tLoss: 1.214716\n", + "\n", + "Test set: Average loss: 2.9396\n", + "Class 0 accuracy: 554.0/980(57%)\n", + "Class 1 accuracy: 1033.0/1135(91%)\n", + "Class 2 accuracy: 387.0/1032(38%)\n", + "Class 3 accuracy: 1008.0/1010(100%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/12089 (0%)]\tLoss: 1.242918\n", + "Train Epoch: 2 [640/12089 (5%)]\tLoss: 1.003339\n", + 
"Train Epoch: 2 [1280/12089 (11%)]\tLoss: 0.984789\n", + "Train Epoch: 2 [1920/12089 (16%)]\tLoss: 0.937961\n", + "Train Epoch: 2 [2560/12089 (21%)]\tLoss: 0.883540\n", + "Train Epoch: 2 [3200/12089 (26%)]\tLoss: 0.840368\n", + "Train Epoch: 2 [3840/12089 (32%)]\tLoss: 0.937714\n", + "Train Epoch: 2 [4480/12089 (37%)]\tLoss: 0.909657\n", + "Train Epoch: 2 [5120/12089 (42%)]\tLoss: 0.840488\n", + "Train Epoch: 2 [5760/12089 (48%)]\tLoss: 0.763511\n", + "Train Epoch: 2 [6400/12089 (53%)]\tLoss: 0.767492\n", + "Train Epoch: 2 [7040/12089 (58%)]\tLoss: 0.721862\n", + "Train Epoch: 2 [7680/12089 (63%)]\tLoss: 0.698475\n", + "Train Epoch: 2 [8320/12089 (69%)]\tLoss: 0.630833\n", + "Train Epoch: 2 [8960/12089 (74%)]\tLoss: 0.732636\n", + "Train Epoch: 2 [9600/12089 (79%)]\tLoss: 0.686765\n", + "Train Epoch: 2 [10240/12089 (85%)]\tLoss: 0.647560\n", + "Train Epoch: 2 [10880/12089 (90%)]\tLoss: 0.584798\n", + "Train Epoch: 2 [11520/12089 (95%)]\tLoss: 0.605022\n", + "\n", + "Test set: Average loss: 3.8344\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 889.0/1032(86%)\n", + "Class 3 accuracy: 985.0/1010(98%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12089 (0%)]\tLoss: 0.633021\n", + "Train Epoch: 3 [640/12089 (5%)]\tLoss: 0.661086\n", + "Train Epoch: 3 [1280/12089 (11%)]\tLoss: 0.531795\n", + "Train Epoch: 3 [1920/12089 (16%)]\tLoss: 0.595388\n", + "Train Epoch: 3 [2560/12089 (21%)]\tLoss: 0.484488\n", + "Train Epoch: 3 [3200/12089 (26%)]\tLoss: 0.610725\n", + "Train Epoch: 3 [3840/12089 (32%)]\tLoss: 0.539676\n", + "Train Epoch: 3 [4480/12089 (37%)]\tLoss: 0.555348\n", + "Train Epoch: 3 [5120/12089 (42%)]\tLoss: 0.475156\n", + "Train Epoch: 3 [5760/12089 (48%)]\tLoss: 0.532515\n", + "Train Epoch: 3 [6400/12089 
(53%)]\tLoss: 0.561437\n", + "Train Epoch: 3 [7040/12089 (58%)]\tLoss: 0.513701\n", + "Train Epoch: 3 [7680/12089 (63%)]\tLoss: 0.469366\n", + "Train Epoch: 3 [8320/12089 (69%)]\tLoss: 0.517332\n", + "Train Epoch: 3 [8960/12089 (74%)]\tLoss: 0.443565\n", + "Train Epoch: 3 [9600/12089 (79%)]\tLoss: 0.427636\n", + "Train Epoch: 3 [10240/12089 (85%)]\tLoss: 0.427255\n", + "Train Epoch: 3 [10880/12089 (90%)]\tLoss: 0.556653\n", + "Train Epoch: 3 [11520/12089 (95%)]\tLoss: 0.481399\n", + "\n", + "Test set: Average loss: 4.3145\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 945.0/1032(92%)\n", + "Class 3 accuracy: 967.0/1010(96%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12089 (0%)]\tLoss: 0.505337\n", + "Train Epoch: 4 [640/12089 (5%)]\tLoss: 0.464085\n", + "Train Epoch: 4 [1280/12089 (11%)]\tLoss: 0.518291\n", + "Train Epoch: 4 [1920/12089 (16%)]\tLoss: 0.452366\n", + "Train Epoch: 4 [2560/12089 (21%)]\tLoss: 0.405918\n", + "Train Epoch: 4 [3200/12089 (26%)]\tLoss: 0.502257\n", + "Train Epoch: 4 [3840/12089 (32%)]\tLoss: 0.448973\n", + "Train Epoch: 4 [4480/12089 (37%)]\tLoss: 0.445046\n", + "Train Epoch: 4 [5120/12089 (42%)]\tLoss: 0.495061\n", + "Train Epoch: 4 [5760/12089 (48%)]\tLoss: 0.456786\n", + "Train Epoch: 4 [6400/12089 (53%)]\tLoss: 0.371738\n", + "Train Epoch: 4 [7040/12089 (58%)]\tLoss: 0.468638\n", + "Train Epoch: 4 [7680/12089 (63%)]\tLoss: 0.495899\n", + "Train Epoch: 4 [8320/12089 (69%)]\tLoss: 0.453645\n", + "Train Epoch: 4 [8960/12089 (74%)]\tLoss: 0.479238\n", + "Train Epoch: 4 [9600/12089 (79%)]\tLoss: 0.458163\n", + "Train Epoch: 4 [10240/12089 (85%)]\tLoss: 0.446410\n", + "Train Epoch: 4 [10880/12089 (90%)]\tLoss: 0.441910\n", + "Train Epoch: 4 [11520/12089 (95%)]\tLoss: 0.430284\n", + 
"\n", + "Test set: Average loss: 4.5708\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 952.0/1032(92%)\n", + "Class 3 accuracy: 969.0/1010(96%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12089 (0%)]\tLoss: 0.405303\n", + "Train Epoch: 5 [640/12089 (5%)]\tLoss: 0.396980\n", + "Train Epoch: 5 [1280/12089 (11%)]\tLoss: 0.421218\n", + "Train Epoch: 5 [1920/12089 (16%)]\tLoss: 0.459768\n", + "Train Epoch: 5 [2560/12089 (21%)]\tLoss: 0.354826\n", + "Train Epoch: 5 [3200/12089 (26%)]\tLoss: 0.372944\n", + "Train Epoch: 5 [3840/12089 (32%)]\tLoss: 0.394097\n", + "Train Epoch: 5 [4480/12089 (37%)]\tLoss: 0.444731\n", + "Train Epoch: 5 [5120/12089 (42%)]\tLoss: 0.470775\n", + "Train Epoch: 5 [5760/12089 (48%)]\tLoss: 0.414834\n", + "Train Epoch: 5 [6400/12089 (53%)]\tLoss: 0.451856\n", + "Train Epoch: 5 [7040/12089 (58%)]\tLoss: 0.390931\n", + "Train Epoch: 5 [7680/12089 (63%)]\tLoss: 0.392495\n", + "Train Epoch: 5 [8320/12089 (69%)]\tLoss: 0.341354\n", + "Train Epoch: 5 [8960/12089 (74%)]\tLoss: 0.355052\n", + "Train Epoch: 5 [9600/12089 (79%)]\tLoss: 0.414375\n", + "Train Epoch: 5 [10240/12089 (85%)]\tLoss: 0.419718\n", + "Train Epoch: 5 [10880/12089 (90%)]\tLoss: 0.367832\n", + "Train Epoch: 5 [11520/12089 (95%)]\tLoss: 0.358470\n", + "\n", + "Test set: Average loss: 4.7194\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 953.0/1032(92%)\n", + "Class 3 accuracy: 970.0/1010(96%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/11263 (0%)]\tLoss: 6.261249\n", + "Train 
Epoch: 1 [640/11263 (6%)]\tLoss: 5.999681\n", + "Train Epoch: 1 [1280/11263 (11%)]\tLoss: 5.607321\n", + "Train Epoch: 1 [1920/11263 (17%)]\tLoss: 5.542882\n", + "Train Epoch: 1 [2560/11263 (23%)]\tLoss: 4.963273\n", + "Train Epoch: 1 [3200/11263 (28%)]\tLoss: 4.750457\n", + "Train Epoch: 1 [3840/11263 (34%)]\tLoss: 4.334918\n", + "Train Epoch: 1 [4480/11263 (40%)]\tLoss: 3.912877\n", + "Train Epoch: 1 [5120/11263 (45%)]\tLoss: 3.827431\n", + "Train Epoch: 1 [5760/11263 (51%)]\tLoss: 3.393839\n", + "Train Epoch: 1 [6400/11263 (57%)]\tLoss: 3.033727\n", + "Train Epoch: 1 [7040/11263 (62%)]\tLoss: 2.671916\n", + "Train Epoch: 1 [7680/11263 (68%)]\tLoss: 2.473807\n", + "Train Epoch: 1 [8320/11263 (74%)]\tLoss: 2.285081\n", + "Train Epoch: 1 [8960/11263 (80%)]\tLoss: 1.972579\n", + "Train Epoch: 1 [9600/11263 (85%)]\tLoss: 1.953343\n", + "Train Epoch: 1 [10240/11263 (91%)]\tLoss: 1.653112\n", + "Train Epoch: 1 [10880/11263 (97%)]\tLoss: 1.666049\n", + "\n", + "Test set: Average loss: 2.6135\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 242.0/1135(21%)\n", + "Class 2 accuracy: 341.0/1032(33%)\n", + "Class 3 accuracy: 431.0/1010(43%)\n", + "Class 4 accuracy: 982.0/982(100%)\n", + "Class 5 accuracy: 11.0/892(1%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/11263 (0%)]\tLoss: 1.265681\n", + "Train Epoch: 2 [640/11263 (6%)]\tLoss: 1.242094\n", + "Train Epoch: 2 [1280/11263 (11%)]\tLoss: 1.308110\n", + "Train Epoch: 2 [1920/11263 (17%)]\tLoss: 1.304853\n", + "Train Epoch: 2 [2560/11263 (23%)]\tLoss: 1.242684\n", + "Train Epoch: 2 [3200/11263 (28%)]\tLoss: 1.155575\n", + "Train Epoch: 2 [3840/11263 (34%)]\tLoss: 1.025319\n", + "Train Epoch: 2 [4480/11263 (40%)]\tLoss: 1.151237\n", + "Train Epoch: 2 [5120/11263 (45%)]\tLoss: 1.071076\n", + "Train Epoch: 2 [5760/11263 (51%)]\tLoss: 0.978908\n", + "Train Epoch: 2 [6400/11263 
(57%)]\tLoss: 0.869457\n", + "Train Epoch: 2 [7040/11263 (62%)]\tLoss: 0.841398\n", + "Train Epoch: 2 [7680/11263 (68%)]\tLoss: 0.893406\n", + "Train Epoch: 2 [8320/11263 (74%)]\tLoss: 0.835585\n", + "Train Epoch: 2 [8960/11263 (80%)]\tLoss: 0.868128\n", + "Train Epoch: 2 [9600/11263 (85%)]\tLoss: 0.763401\n", + "Train Epoch: 2 [10240/11263 (91%)]\tLoss: 0.905359\n", + "Train Epoch: 2 [10880/11263 (97%)]\tLoss: 0.842730\n", + "\n", + "Test set: Average loss: 3.4385\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 979.0/982(100%)\n", + "Class 5 accuracy: 808.0/892(91%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/11263 (0%)]\tLoss: 0.688606\n", + "Train Epoch: 3 [640/11263 (6%)]\tLoss: 0.747074\n", + "Train Epoch: 3 [1280/11263 (11%)]\tLoss: 0.699562\n", + "Train Epoch: 3 [1920/11263 (17%)]\tLoss: 0.687192\n", + "Train Epoch: 3 [2560/11263 (23%)]\tLoss: 0.694984\n", + "Train Epoch: 3 [3200/11263 (28%)]\tLoss: 0.643804\n", + "Train Epoch: 3 [3840/11263 (34%)]\tLoss: 0.637270\n", + "Train Epoch: 3 [4480/11263 (40%)]\tLoss: 0.776547\n", + "Train Epoch: 3 [5120/11263 (45%)]\tLoss: 0.624326\n", + "Train Epoch: 3 [5760/11263 (51%)]\tLoss: 0.763693\n", + "Train Epoch: 3 [6400/11263 (57%)]\tLoss: 0.619411\n", + "Train Epoch: 3 [7040/11263 (62%)]\tLoss: 0.672091\n", + "Train Epoch: 3 [7680/11263 (68%)]\tLoss: 0.640160\n", + "Train Epoch: 3 [8320/11263 (74%)]\tLoss: 0.594804\n", + "Train Epoch: 3 [8960/11263 (80%)]\tLoss: 0.712096\n", + "Train Epoch: 3 [9600/11263 (85%)]\tLoss: 0.584561\n", + "Train Epoch: 3 [10240/11263 (91%)]\tLoss: 0.490905\n", + "Train Epoch: 3 [10880/11263 (97%)]\tLoss: 0.511629\n", + "\n", + "Test set: Average loss: 3.9981\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", 
+ "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 975.0/982(99%)\n", + "Class 5 accuracy: 837.0/892(94%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/11263 (0%)]\tLoss: 0.560350\n", + "Train Epoch: 4 [640/11263 (6%)]\tLoss: 0.549644\n", + "Train Epoch: 4 [1280/11263 (11%)]\tLoss: 0.548100\n", + "Train Epoch: 4 [1920/11263 (17%)]\tLoss: 0.523234\n", + "Train Epoch: 4 [2560/11263 (23%)]\tLoss: 0.563891\n", + "Train Epoch: 4 [3200/11263 (28%)]\tLoss: 0.462694\n", + "Train Epoch: 4 [3840/11263 (34%)]\tLoss: 0.562608\n", + "Train Epoch: 4 [4480/11263 (40%)]\tLoss: 0.446004\n", + "Train Epoch: 4 [5120/11263 (45%)]\tLoss: 0.511273\n", + "Train Epoch: 4 [5760/11263 (51%)]\tLoss: 0.548768\n", + "Train Epoch: 4 [6400/11263 (57%)]\tLoss: 0.529422\n", + "Train Epoch: 4 [7040/11263 (62%)]\tLoss: 0.544079\n", + "Train Epoch: 4 [7680/11263 (68%)]\tLoss: 0.428724\n", + "Train Epoch: 4 [8320/11263 (74%)]\tLoss: 0.600822\n", + "Train Epoch: 4 [8960/11263 (80%)]\tLoss: 0.474362\n", + "Train Epoch: 4 [9600/11263 (85%)]\tLoss: 0.595750\n", + "Train Epoch: 4 [10240/11263 (91%)]\tLoss: 0.544630\n", + "Train Epoch: 4 [10880/11263 (97%)]\tLoss: 0.506346\n", + "\n", + "Test set: Average loss: 4.3219\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 974.0/982(99%)\n", + "Class 5 accuracy: 841.0/892(94%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/11263 (0%)]\tLoss: 0.355252\n", + "Train Epoch: 5 [640/11263 (6%)]\tLoss: 0.517941\n", + "Train Epoch: 5 [1280/11263 (11%)]\tLoss: 0.526465\n", + "Train Epoch: 5 [1920/11263 (17%)]\tLoss: 0.523074\n", + "Train Epoch: 5 
[2560/11263 (23%)]\tLoss: 0.433639\n", + "Train Epoch: 5 [3200/11263 (28%)]\tLoss: 0.434077\n", + "Train Epoch: 5 [3840/11263 (34%)]\tLoss: 0.403323\n", + "Train Epoch: 5 [4480/11263 (40%)]\tLoss: 0.505131\n", + "Train Epoch: 5 [5120/11263 (45%)]\tLoss: 0.355989\n", + "Train Epoch: 5 [5760/11263 (51%)]\tLoss: 0.490564\n", + "Train Epoch: 5 [6400/11263 (57%)]\tLoss: 0.399952\n", + "Train Epoch: 5 [7040/11263 (62%)]\tLoss: 0.436878\n", + "Train Epoch: 5 [7680/11263 (68%)]\tLoss: 0.491910\n", + "Train Epoch: 5 [8320/11263 (74%)]\tLoss: 0.429957\n", + "Train Epoch: 5 [8960/11263 (80%)]\tLoss: 0.495502\n", + "Train Epoch: 5 [9600/11263 (85%)]\tLoss: 0.446051\n", + "Train Epoch: 5 [10240/11263 (91%)]\tLoss: 0.364511\n", + "Train Epoch: 5 [10880/11263 (97%)]\tLoss: 0.447680\n", + "\n", + "Test set: Average loss: 4.5150\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 974.0/982(99%)\n", + "Class 5 accuracy: 843.0/892(95%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/12183 (0%)]\tLoss: 7.209232\n", + "Train Epoch: 1 [640/12183 (5%)]\tLoss: 7.299924\n", + "Train Epoch: 1 [1280/12183 (10%)]\tLoss: 6.381386\n", + "Train Epoch: 1 [1920/12183 (16%)]\tLoss: 6.263927\n", + "Train Epoch: 1 [2560/12183 (21%)]\tLoss: 5.731481\n", + "Train Epoch: 1 [3200/12183 (26%)]\tLoss: 5.564906\n", + "Train Epoch: 1 [3840/12183 (31%)]\tLoss: 4.826056\n", + "Train Epoch: 1 [4480/12183 (37%)]\tLoss: 4.433992\n", + "Train Epoch: 1 [5120/12183 (42%)]\tLoss: 4.331242\n", + "Train Epoch: 1 [5760/12183 (47%)]\tLoss: 3.656218\n", + "Train Epoch: 1 [6400/12183 (52%)]\tLoss: 3.236688\n", + "Train Epoch: 1 [7040/12183 (58%)]\tLoss: 2.764972\n", + "Train Epoch: 1 [7680/12183 (63%)]\tLoss: 2.587098\n", + "Train Epoch: 1 [8320/12183 (68%)]\tLoss: 
2.090186\n", + "Train Epoch: 1 [8960/12183 (73%)]\tLoss: 2.049698\n", + "Train Epoch: 1 [9600/12183 (79%)]\tLoss: 1.641774\n", + "Train Epoch: 1 [10240/12183 (84%)]\tLoss: 1.447641\n", + "Train Epoch: 1 [10880/12183 (89%)]\tLoss: 1.294460\n", + "Train Epoch: 1 [11520/12183 (94%)]\tLoss: 1.226808\n", + "Train Epoch: 1 [4370/12183 (99%)]\tLoss: 0.847535\n", + "\n", + "Test set: Average loss: 2.5262\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 1.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 957.0/958(100%)\n", + "Class 7 accuracy: 795.0/1028(77%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/12183 (0%)]\tLoss: 1.063643\n", + "Train Epoch: 2 [640/12183 (5%)]\tLoss: 0.945048\n", + "Train Epoch: 2 [1280/12183 (10%)]\tLoss: 0.910895\n", + "Train Epoch: 2 [1920/12183 (16%)]\tLoss: 0.803437\n", + "Train Epoch: 2 [2560/12183 (21%)]\tLoss: 0.714711\n", + "Train Epoch: 2 [3200/12183 (26%)]\tLoss: 0.731389\n", + "Train Epoch: 2 [3840/12183 (31%)]\tLoss: 0.697865\n", + "Train Epoch: 2 [4480/12183 (37%)]\tLoss: 0.518302\n", + "Train Epoch: 2 [5120/12183 (42%)]\tLoss: 0.506918\n", + "Train Epoch: 2 [5760/12183 (47%)]\tLoss: 0.638351\n", + "Train Epoch: 2 [6400/12183 (52%)]\tLoss: 0.607182\n", + "Train Epoch: 2 [7040/12183 (58%)]\tLoss: 0.582088\n", + "Train Epoch: 2 [7680/12183 (63%)]\tLoss: 0.526564\n", + "Train Epoch: 2 [8320/12183 (68%)]\tLoss: 0.453763\n", + "Train Epoch: 2 [8960/12183 (73%)]\tLoss: 0.463578\n", + "Train Epoch: 2 [9600/12183 (79%)]\tLoss: 0.505179\n", + "Train Epoch: 2 [10240/12183 (84%)]\tLoss: 0.390394\n", + "Train Epoch: 2 [10880/12183 (89%)]\tLoss: 0.431393\n", + "Train Epoch: 2 [11520/12183 (94%)]\tLoss: 0.422808\n", + "Train Epoch: 2 [4370/12183 (99%)]\tLoss: 0.379329\n", + "\n", + "Test set: Average loss: 3.8944\n", + "Class 0 accuracy: 
0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 954.0/958(100%)\n", + "Class 7 accuracy: 1005.0/1028(98%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12183 (0%)]\tLoss: 0.411217\n", + "Train Epoch: 3 [640/12183 (5%)]\tLoss: 0.430715\n", + "Train Epoch: 3 [1280/12183 (10%)]\tLoss: 0.321807\n", + "Train Epoch: 3 [1920/12183 (16%)]\tLoss: 0.305609\n", + "Train Epoch: 3 [2560/12183 (21%)]\tLoss: 0.329529\n", + "Train Epoch: 3 [3200/12183 (26%)]\tLoss: 0.344710\n", + "Train Epoch: 3 [3840/12183 (31%)]\tLoss: 0.351153\n", + "Train Epoch: 3 [4480/12183 (37%)]\tLoss: 0.355009\n", + "Train Epoch: 3 [5120/12183 (42%)]\tLoss: 0.316889\n", + "Train Epoch: 3 [5760/12183 (47%)]\tLoss: 0.268590\n", + "Train Epoch: 3 [6400/12183 (52%)]\tLoss: 0.269210\n", + "Train Epoch: 3 [7040/12183 (58%)]\tLoss: 0.272690\n", + "Train Epoch: 3 [7680/12183 (63%)]\tLoss: 0.299527\n", + "Train Epoch: 3 [8320/12183 (68%)]\tLoss: 0.294239\n", + "Train Epoch: 3 [8960/12183 (73%)]\tLoss: 0.256061\n", + "Train Epoch: 3 [9600/12183 (79%)]\tLoss: 0.263354\n", + "Train Epoch: 3 [10240/12183 (84%)]\tLoss: 0.266107\n", + "Train Epoch: 3 [10880/12183 (89%)]\tLoss: 0.301182\n", + "Train Epoch: 3 [11520/12183 (94%)]\tLoss: 0.221701\n", + "Train Epoch: 3 [4370/12183 (99%)]\tLoss: 0.256709\n", + "\n", + "Test set: Average loss: 4.6037\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 954.0/958(100%)\n", + "Class 7 accuracy: 1012.0/1028(98%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12183 (0%)]\tLoss: 0.200790\n", + "Train Epoch: 4 
[640/12183 (5%)]\tLoss: 0.200424\n", + "Train Epoch: 4 [1280/12183 (10%)]\tLoss: 0.190599\n", + "Train Epoch: 4 [1920/12183 (16%)]\tLoss: 0.205490\n", + "Train Epoch: 4 [2560/12183 (21%)]\tLoss: 0.245161\n", + "Train Epoch: 4 [3200/12183 (26%)]\tLoss: 0.154059\n", + "Train Epoch: 4 [3840/12183 (31%)]\tLoss: 0.181401\n", + "Train Epoch: 4 [4480/12183 (37%)]\tLoss: 0.283187\n", + "Train Epoch: 4 [5120/12183 (42%)]\tLoss: 0.176126\n", + "Train Epoch: 4 [5760/12183 (47%)]\tLoss: 0.218665\n", + "Train Epoch: 4 [6400/12183 (52%)]\tLoss: 0.294239\n", + "Train Epoch: 4 [7040/12183 (58%)]\tLoss: 0.213903\n", + "Train Epoch: 4 [7680/12183 (63%)]\tLoss: 0.233052\n", + "Train Epoch: 4 [8320/12183 (68%)]\tLoss: 0.161038\n", + "Train Epoch: 4 [8960/12183 (73%)]\tLoss: 0.211654\n", + "Train Epoch: 4 [9600/12183 (79%)]\tLoss: 0.192449\n", + "Train Epoch: 4 [10240/12183 (84%)]\tLoss: 0.161328\n", + "Train Epoch: 4 [10880/12183 (89%)]\tLoss: 0.197734\n", + "Train Epoch: 4 [11520/12183 (94%)]\tLoss: 0.191102\n", + "Train Epoch: 4 [4370/12183 (99%)]\tLoss: 0.376056\n", + "\n", + "Test set: Average loss: 4.9524\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 955.0/958(100%)\n", + "Class 7 accuracy: 1013.0/1028(99%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12183 (0%)]\tLoss: 0.250694\n", + "Train Epoch: 5 [640/12183 (5%)]\tLoss: 0.137549\n", + "Train Epoch: 5 [1280/12183 (10%)]\tLoss: 0.179946\n", + "Train Epoch: 5 [1920/12183 (16%)]\tLoss: 0.172115\n", + "Train Epoch: 5 [2560/12183 (21%)]\tLoss: 0.216046\n", + "Train Epoch: 5 [3200/12183 (26%)]\tLoss: 0.137594\n", + "Train Epoch: 5 [3840/12183 (31%)]\tLoss: 0.167268\n", + "Train Epoch: 5 [4480/12183 (37%)]\tLoss: 0.215348\n", + "Train Epoch: 5 [5120/12183 (42%)]\tLoss: 
0.190677\n", + "Train Epoch: 5 [5760/12183 (47%)]\tLoss: 0.143424\n", + "Train Epoch: 5 [6400/12183 (52%)]\tLoss: 0.176460\n", + "Train Epoch: 5 [7040/12183 (58%)]\tLoss: 0.115466\n", + "Train Epoch: 5 [7680/12183 (63%)]\tLoss: 0.123880\n", + "Train Epoch: 5 [8320/12183 (68%)]\tLoss: 0.172899\n", + "Train Epoch: 5 [8960/12183 (73%)]\tLoss: 0.121368\n", + "Train Epoch: 5 [9600/12183 (79%)]\tLoss: 0.117190\n", + "Train Epoch: 5 [10240/12183 (84%)]\tLoss: 0.193983\n", + "Train Epoch: 5 [10880/12183 (89%)]\tLoss: 0.137996\n", + "Train Epoch: 5 [11520/12183 (94%)]\tLoss: 0.165303\n", + "Train Epoch: 5 [4370/12183 (99%)]\tLoss: 0.120738\n", + "\n", + "Test set: Average loss: 5.1628\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 955.0/958(100%)\n", + "Class 7 accuracy: 1014.0/1028(99%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/11800 (0%)]\tLoss: 8.108945\n", + "Train Epoch: 1 [640/11800 (5%)]\tLoss: 7.738531\n", + "Train Epoch: 1 [1280/11800 (11%)]\tLoss: 6.640255\n", + "Train Epoch: 1 [1920/11800 (16%)]\tLoss: 6.513710\n", + "Train Epoch: 1 [2560/11800 (22%)]\tLoss: 5.460023\n", + "Train Epoch: 1 [3200/11800 (27%)]\tLoss: 5.351851\n", + "Train Epoch: 1 [3840/11800 (32%)]\tLoss: 4.810606\n", + "Train Epoch: 1 [4480/11800 (38%)]\tLoss: 4.409184\n", + "Train Epoch: 1 [5120/11800 (43%)]\tLoss: 3.466255\n", + "Train Epoch: 1 [5760/11800 (49%)]\tLoss: 3.398129\n", + "Train Epoch: 1 [6400/11800 (54%)]\tLoss: 2.812559\n", + "Train Epoch: 1 [7040/11800 (59%)]\tLoss: 2.539098\n", + "Train Epoch: 1 [7680/11800 (65%)]\tLoss: 1.932615\n", + "Train Epoch: 1 [8320/11800 (70%)]\tLoss: 1.948097\n", + "Train Epoch: 1 [8960/11800 (76%)]\tLoss: 1.529168\n", + "Train Epoch: 1 [9600/11800 (81%)]\tLoss: 1.568914\n", + "Train Epoch: 1 
[10240/11800 (86%)]\tLoss: 1.332329\n", + "Train Epoch: 1 [10880/11800 (92%)]\tLoss: 1.441239\n", + "Train Epoch: 1 [11520/11800 (97%)]\tLoss: 1.161227\n", + "\n", + "Test set: Average loss: 2.4228\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 485.0/958(51%)\n", + "Class 7 accuracy: 345.0/1028(34%)\n", + "Class 8 accuracy: 962.0/974(99%)\n", + "Class 9 accuracy: 735.0/1009(73%)\n", + "Train Epoch: 2 [0/11800 (0%)]\tLoss: 1.033281\n", + "Train Epoch: 2 [640/11800 (5%)]\tLoss: 1.074798\n", + "Train Epoch: 2 [1280/11800 (11%)]\tLoss: 1.087005\n", + "Train Epoch: 2 [1920/11800 (16%)]\tLoss: 1.221566\n", + "Train Epoch: 2 [2560/11800 (22%)]\tLoss: 1.020146\n", + "Train Epoch: 2 [3200/11800 (27%)]\tLoss: 1.010463\n", + "Train Epoch: 2 [3840/11800 (32%)]\tLoss: 0.871487\n", + "Train Epoch: 2 [4480/11800 (38%)]\tLoss: 0.892453\n", + "Train Epoch: 2 [5120/11800 (43%)]\tLoss: 0.761051\n", + "Train Epoch: 2 [5760/11800 (49%)]\tLoss: 0.883746\n", + "Train Epoch: 2 [6400/11800 (54%)]\tLoss: 0.881131\n", + "Train Epoch: 2 [7040/11800 (59%)]\tLoss: 0.761468\n", + "Train Epoch: 2 [7680/11800 (65%)]\tLoss: 0.702959\n", + "Train Epoch: 2 [8320/11800 (70%)]\tLoss: 0.575911\n", + "Train Epoch: 2 [8960/11800 (76%)]\tLoss: 0.668820\n", + "Train Epoch: 2 [9600/11800 (81%)]\tLoss: 0.780607\n", + "Train Epoch: 2 [10240/11800 (86%)]\tLoss: 0.565945\n", + "Train Epoch: 2 [10880/11800 (92%)]\tLoss: 0.687550\n", + "Train Epoch: 2 [11520/11800 (97%)]\tLoss: 0.551138\n", + "\n", + "Test set: Average loss: 3.3994\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 
0.0/1028(0%)\n", + "Class 8 accuracy: 940.0/974(97%)\n", + "Class 9 accuracy: 914.0/1009(91%)\n", + "Train Epoch: 3 [0/11800 (0%)]\tLoss: 0.637666\n", + "Train Epoch: 3 [640/11800 (5%)]\tLoss: 0.512363\n", + "Train Epoch: 3 [1280/11800 (11%)]\tLoss: 0.587236\n", + "Train Epoch: 3 [1920/11800 (16%)]\tLoss: 0.496453\n", + "Train Epoch: 3 [2560/11800 (22%)]\tLoss: 0.617932\n", + "Train Epoch: 3 [3200/11800 (27%)]\tLoss: 0.538651\n", + "Train Epoch: 3 [3840/11800 (32%)]\tLoss: 0.471803\n", + "Train Epoch: 3 [4480/11800 (38%)]\tLoss: 0.569236\n", + "Train Epoch: 3 [5120/11800 (43%)]\tLoss: 0.473018\n", + "Train Epoch: 3 [5760/11800 (49%)]\tLoss: 0.661038\n", + "Train Epoch: 3 [6400/11800 (54%)]\tLoss: 0.436601\n", + "Train Epoch: 3 [7040/11800 (59%)]\tLoss: 0.551020\n", + "Train Epoch: 3 [7680/11800 (65%)]\tLoss: 0.422065\n", + "Train Epoch: 3 [8320/11800 (70%)]\tLoss: 0.436460\n", + "Train Epoch: 3 [8960/11800 (76%)]\tLoss: 0.521548\n", + "Train Epoch: 3 [9600/11800 (81%)]\tLoss: 0.582636\n", + "Train Epoch: 3 [10240/11800 (86%)]\tLoss: 0.460395\n", + "Train Epoch: 3 [10880/11800 (92%)]\tLoss: 0.637835\n", + "Train Epoch: 3 [11520/11800 (97%)]\tLoss: 0.514315\n", + "\n", + "Test set: Average loss: 3.9214\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 934.0/974(96%)\n", + "Class 9 accuracy: 939.0/1009(93%)\n", + "Train Epoch: 4 [0/11800 (0%)]\tLoss: 0.498162\n", + "Train Epoch: 4 [640/11800 (5%)]\tLoss: 0.536717\n", + "Train Epoch: 4 [1280/11800 (11%)]\tLoss: 0.436568\n", + "Train Epoch: 4 [1920/11800 (16%)]\tLoss: 0.471787\n", + "Train Epoch: 4 [2560/11800 (22%)]\tLoss: 0.497887\n", + "Train Epoch: 4 [3200/11800 (27%)]\tLoss: 0.444460\n", + "Train Epoch: 4 [3840/11800 (32%)]\tLoss: 0.448744\n", + 
"Train Epoch: 4 [4480/11800 (38%)]\tLoss: 0.372841\n", + "Train Epoch: 4 [5120/11800 (43%)]\tLoss: 0.465649\n", + "Train Epoch: 4 [5760/11800 (49%)]\tLoss: 0.490277\n", + "Train Epoch: 4 [6400/11800 (54%)]\tLoss: 0.463720\n", + "Train Epoch: 4 [7040/11800 (59%)]\tLoss: 0.355945\n", + "Train Epoch: 4 [7680/11800 (65%)]\tLoss: 0.438429\n", + "Train Epoch: 4 [8320/11800 (70%)]\tLoss: 0.508788\n", + "Train Epoch: 4 [8960/11800 (76%)]\tLoss: 0.413552\n", + "Train Epoch: 4 [9600/11800 (81%)]\tLoss: 0.395993\n", + "Train Epoch: 4 [10240/11800 (86%)]\tLoss: 0.410553\n", + "Train Epoch: 4 [10880/11800 (92%)]\tLoss: 0.409377\n", + "Train Epoch: 4 [11520/11800 (97%)]\tLoss: 0.400534\n", + "\n", + "Test set: Average loss: 4.2109\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 930.0/974(95%)\n", + "Class 9 accuracy: 948.0/1009(94%)\n", + "Train Epoch: 5 [0/11800 (0%)]\tLoss: 0.441779\n", + "Train Epoch: 5 [640/11800 (5%)]\tLoss: 0.349478\n", + "Train Epoch: 5 [1280/11800 (11%)]\tLoss: 0.347695\n", + "Train Epoch: 5 [1920/11800 (16%)]\tLoss: 0.374920\n", + "Train Epoch: 5 [2560/11800 (22%)]\tLoss: 0.371782\n", + "Train Epoch: 5 [3200/11800 (27%)]\tLoss: 0.405380\n", + "Train Epoch: 5 [3840/11800 (32%)]\tLoss: 0.493990\n", + "Train Epoch: 5 [4480/11800 (38%)]\tLoss: 0.383761\n", + "Train Epoch: 5 [5120/11800 (43%)]\tLoss: 0.361125\n", + "Train Epoch: 5 [5760/11800 (49%)]\tLoss: 0.377500\n", + "Train Epoch: 5 [6400/11800 (54%)]\tLoss: 0.411204\n", + "Train Epoch: 5 [7040/11800 (59%)]\tLoss: 0.467779\n", + "Train Epoch: 5 [7680/11800 (65%)]\tLoss: 0.445416\n", + "Train Epoch: 5 [8320/11800 (70%)]\tLoss: 0.303449\n", + "Train Epoch: 5 [8960/11800 (76%)]\tLoss: 0.319432\n", + "Train Epoch: 5 [9600/11800 
(81%)]\tLoss: 0.331827\n", + "Train Epoch: 5 [10240/11800 (86%)]\tLoss: 0.377502\n", + "Train Epoch: 5 [10880/11800 (92%)]\tLoss: 0.406466\n", + "Train Epoch: 5 [11520/11800 (97%)]\tLoss: 0.405720\n", + "\n", + "Test set: Average loss: 4.3858\n", + "Class 0 accuracy: 0.0/980(0%)\n", + "Class 1 accuracy: 0.0/1135(0%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 929.0/974(95%)\n", + "Class 9 accuracy: 950.0/1009(94%)\n", + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 5.571240\n", + "Train Epoch: 1 [640/12665 (5%)]\tLoss: 5.058652\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 4.223537\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 3.769430\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 3.397155\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 3.066763\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 2.407099\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 2.510794\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 1.850332\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 1.656529\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 1.517869\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 1.028974\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.833506\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.765792\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.600499\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.491542\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.525203\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.473181\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.445249\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.329707\n", + "\n", + "Test set: Average loss: 2.6586\n", + "Class 0 accuracy: 974.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 
0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 616.0/1009(61%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.174450\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.286020\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.380822\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.200067\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.233174\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.215359\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.261502\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.193090\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.201911\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.123239\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.151434\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.161058\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.121602\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.152282\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.138010\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.116535\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.148996\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.094655\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.093630\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.100545\n", + "\n", + "Test set: Average loss: 3.7860\n", + "Class 0 accuracy: 974.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.113853\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.061060\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.073625\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.089106\n", + 
"Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.100265\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.086965\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.078005\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.089567\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.083796\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.091500\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.071154\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.063725\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.081232\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.063744\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.044772\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.056600\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.075639\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.059448\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.051801\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.045583\n", + "\n", + "Test set: Average loss: 4.3795\n", + "Class 0 accuracy: 974.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.073423\n", + "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.081250\n", + "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.107188\n", + "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.108589\n", + "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.074006\n", + "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.038409\n", + "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.065204\n", + "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.083654\n", + "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.073944\n", + "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.048630\n", + "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.041222\n", + "Train Epoch: 4 [7040/12665 
(56%)]\tLoss: 0.055742\n", + "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.048848\n", + "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.099426\n", + "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.050589\n", + "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.039493\n", + "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.059188\n", + "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.071380\n", + "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.095400\n", + "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.052493\n", + "\n", + "Test set: Average loss: 4.6909\n", + "Class 0 accuracy: 975.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.042433\n", + "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.045415\n", + "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.045671\n", + "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.116742\n", + "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.042136\n", + "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.053295\n", + "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.035618\n", + "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.055716\n", + "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.043886\n", + "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.052791\n", + "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.079626\n", + "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.044485\n", + "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.027041\n", + "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.041513\n", + "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.034053\n", + "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.028694\n", + "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.054827\n", + "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.182031\n", + "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.068930\n", + 
"Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.022576\n", + "\n", + "Test set: Average loss: 4.8702\n", + "Class 0 accuracy: 976.0/980(100%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n" + ] + } + ] + }, + { + "cell_type": "code", + "source": [ + "# Exercise 2: Implementing the previous exercise should have shown that the network\n", + "# suffers from catastrophic forgetting. To fix this, implement a memory replay buffer\n", + "# and use this buffer to counteract the catastrophic forgetting.\n", + "#\n", + "# Implementation requires adaptation of the cells above, plus the addition of a new\n", + "# experiment setup below.\n", + "\n", + "\n", + "### START SOLUTION ###\n", + "# The experiment setup is identical to the one above, but now we initialize and use\n", + "# a replay buffer. 
# Right now, the buffer only stores a single image for each class.
# As a bonus exercise, explore how different variants of the replay buffer affect the
# resulting model performance.

def train_memory_replay():
    """Run the sequential two-class training schedule with a shared replay buffer.

    A new ``Net`` and a new ``Buffer`` are created, then ``train_model`` is
    called once per phase, in this order: classes 0/1, 2/3, 4/5, 6/7, 8/9 and
    finally 0/1 a second time. Before each call the module-level
    ``config.train_classes`` is overwritten with the classes of that phase;
    it is not restored afterwards, so it is left at ``[0, 1]`` on return.

    The same ``history`` list and the same ``buffer`` object are handed to
    every ``train_model`` call, so whatever ``train_model`` records in them
    carries over from one phase to the next.
    NOTE(review): what exactly ``train_model`` appends to ``history`` and how
    it uses ``buffer`` is defined in another cell -- confirm there.

    Returns:
        The ``history`` list that was passed to every ``train_model`` call.
    """
    # (phase label, classes trained in that phase), in execution order.
    schedule = (
        ("0_1", (0, 1)),
        ("2_3", (2, 3)),
        ("4_5", (4, 5)),
        ("6_7", (6, 7)),
        ("8_9", (8, 9)),
        ("0_1_again", (0, 1)),
    )

    model = Net()
    history = []
    buffer = Buffer()

    for phase_label, phase_classes in schedule:
        # Assign a fresh list each time, exactly as the literal assignments did.
        config.train_classes = list(phase_classes)
        train_model(
            config,
            model,
            phase=phase_label,
            history=history,
            buffer=buffer,
        )

    return history

### END SOLUTION ###

history_memory_replay = train_memory_replay()
history_memory_replay
Epoch: 1 [5120/12665 (40%)]\tLoss: 1.617715\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 1.727536\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 1.507114\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 1.447730\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 1.549878\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 1.058249\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 1.447155\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 1.273197\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 1.260120\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 1.187015\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 1.091164\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.971557\n", + "\n", + "Test set: Average loss: 2.7060\n", + "Class 0 accuracy: 972.0/980(99%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.952087\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.869477\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.858798\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.809786\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.799570\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.890806\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.805940\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 1.059435\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.478667\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.673640\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.538314\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.710136\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.516661\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.602048\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.384920\n", + "Train Epoch: 2 [9600/12665 
(76%)]\tLoss: 0.435023\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.372631\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.426314\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.539168\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.321303\n", + "\n", + "Test set: Average loss: 3.8263\n", + "Class 0 accuracy: 966.0/980(99%)\n", + "Class 1 accuracy: 1135.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.401120\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.263190\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.398854\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.229336\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.240626\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.239559\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.418891\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.177813\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.226682\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.215379\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.211677\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.224589\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.253302\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.212234\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.230823\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.164656\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.154504\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.100245\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.156521\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.232217\n", + "\n", + "Test set: Average loss: 4.6647\n", + "Class 0 accuracy: 963.0/980(98%)\n", + "Class 1 accuracy: 1135.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + 
"Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.131072\n", + "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.227836\n", + "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.161914\n", + "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.182439\n", + "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.123449\n", + "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.118936\n", + "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.132258\n", + "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.191232\n", + "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.192155\n", + "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.122639\n", + "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.138319\n", + "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.106367\n", + "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.078942\n", + "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.103141\n", + "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.129387\n", + "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.117389\n", + "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.164451\n", + "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.216510\n", + "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.110041\n", + "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.104683\n", + "\n", + "Test set: Average loss: 5.1577\n", + "Class 0 accuracy: 966.0/980(99%)\n", + "Class 1 accuracy: 1135.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.077715\n", + "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.105138\n", + "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.124953\n", + 
"Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.080610\n", + "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.123617\n", + "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.112670\n", + "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.093631\n", + "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.122231\n", + "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.093652\n", + "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.167812\n", + "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.117981\n", + "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.066692\n", + "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.080171\n", + "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.092669\n", + "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.146656\n", + "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.101289\n", + "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.089997\n", + "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.108752\n", + "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.078000\n", + "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.046221\n", + "\n", + "Test set: Average loss: 5.4729\n", + "Class 0 accuracy: 968.0/980(99%)\n", + "Class 1 accuracy: 1135.0/1135(100%)\n", + "Class 2 accuracy: 0.0/1032(0%)\n", + "Class 3 accuracy: 0.0/1010(0%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/12089 (0%)]\tLoss: 1.166433\n", + "Train Epoch: 1 [640/12089 (5%)]\tLoss: 1.153999\n", + "Train Epoch: 1 [1280/12089 (11%)]\tLoss: 1.238186\n", + "Train Epoch: 1 [1920/12089 (16%)]\tLoss: 1.274190\n", + "Train Epoch: 1 [2560/12089 (21%)]\tLoss: 1.001455\n", + "Train Epoch: 1 [3200/12089 (26%)]\tLoss: 0.980768\n", + "Train Epoch: 1 [3840/12089 (32%)]\tLoss: 0.890982\n", + "Train Epoch: 1 [4480/12089 (37%)]\tLoss: 0.845770\n", + "Train Epoch: 1 [5120/12089 (42%)]\tLoss: 0.915158\n", + "Train Epoch: 1 [5760/12089 (48%)]\tLoss: 0.577478\n", + "Train Epoch: 1 [6400/12089 
(53%)]\tLoss: 0.558826\n", + "Train Epoch: 1 [7040/12089 (58%)]\tLoss: 0.697927\n", + "Train Epoch: 1 [7680/12089 (63%)]\tLoss: 0.780273\n", + "Train Epoch: 1 [8320/12089 (69%)]\tLoss: 0.586348\n", + "Train Epoch: 1 [8960/12089 (74%)]\tLoss: 0.634719\n", + "Train Epoch: 1 [9600/12089 (79%)]\tLoss: 0.753965\n", + "Train Epoch: 1 [10240/12089 (85%)]\tLoss: 0.886030\n", + "Train Epoch: 1 [10880/12089 (90%)]\tLoss: 0.913329\n", + "Train Epoch: 1 [11520/12089 (95%)]\tLoss: 0.726805\n", + "\n", + "Test set: Average loss: 2.9830\n", + "Class 0 accuracy: 966.0/980(99%)\n", + "Class 1 accuracy: 1132.0/1135(100%)\n", + "Class 2 accuracy: 109.0/1032(11%)\n", + "Class 3 accuracy: 668.0/1010(66%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/12089 (0%)]\tLoss: 0.903527\n", + "Train Epoch: 2 [640/12089 (5%)]\tLoss: 0.690564\n", + "Train Epoch: 2 [1280/12089 (11%)]\tLoss: 1.054734\n", + "Train Epoch: 2 [1920/12089 (16%)]\tLoss: 0.668291\n", + "Train Epoch: 2 [2560/12089 (21%)]\tLoss: 0.846006\n", + "Train Epoch: 2 [3200/12089 (26%)]\tLoss: 0.862174\n", + "Train Epoch: 2 [3840/12089 (32%)]\tLoss: 1.078590\n", + "Train Epoch: 2 [4480/12089 (37%)]\tLoss: 0.812564\n", + "Train Epoch: 2 [5120/12089 (42%)]\tLoss: 0.751745\n", + "Train Epoch: 2 [5760/12089 (48%)]\tLoss: 0.819927\n", + "Train Epoch: 2 [6400/12089 (53%)]\tLoss: 0.641764\n", + "Train Epoch: 2 [7040/12089 (58%)]\tLoss: 0.941192\n", + "Train Epoch: 2 [7680/12089 (63%)]\tLoss: 1.113382\n", + "Train Epoch: 2 [8320/12089 (69%)]\tLoss: 0.745287\n", + "Train Epoch: 2 [8960/12089 (74%)]\tLoss: 0.845461\n", + "Train Epoch: 2 [9600/12089 (79%)]\tLoss: 0.675010\n", + "Train Epoch: 2 [10240/12089 (85%)]\tLoss: 0.772856\n", + "Train Epoch: 2 [10880/12089 (90%)]\tLoss: 0.668837\n", + "Train Epoch: 2 [11520/12089 (95%)]\tLoss: 
0.776711\n", + "\n", + "Test set: Average loss: 3.1608\n", + "Class 0 accuracy: 828.0/980(84%)\n", + "Class 1 accuracy: 1091.0/1135(96%)\n", + "Class 2 accuracy: 898.0/1032(87%)\n", + "Class 3 accuracy: 983.0/1010(97%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12089 (0%)]\tLoss: 0.733399\n", + "Train Epoch: 3 [640/12089 (5%)]\tLoss: 0.793913\n", + "Train Epoch: 3 [1280/12089 (11%)]\tLoss: 0.580512\n", + "Train Epoch: 3 [1920/12089 (16%)]\tLoss: 0.477269\n", + "Train Epoch: 3 [2560/12089 (21%)]\tLoss: 0.833255\n", + "Train Epoch: 3 [3200/12089 (26%)]\tLoss: 0.636208\n", + "Train Epoch: 3 [3840/12089 (32%)]\tLoss: 0.573351\n", + "Train Epoch: 3 [4480/12089 (37%)]\tLoss: 0.656650\n", + "Train Epoch: 3 [5120/12089 (42%)]\tLoss: 0.692221\n", + "Train Epoch: 3 [5760/12089 (48%)]\tLoss: 0.723047\n", + "Train Epoch: 3 [6400/12089 (53%)]\tLoss: 0.626788\n", + "Train Epoch: 3 [7040/12089 (58%)]\tLoss: 0.557750\n", + "Train Epoch: 3 [7680/12089 (63%)]\tLoss: 0.643362\n", + "Train Epoch: 3 [8320/12089 (69%)]\tLoss: 0.725737\n", + "Train Epoch: 3 [8960/12089 (74%)]\tLoss: 0.868968\n", + "Train Epoch: 3 [9600/12089 (79%)]\tLoss: 0.720436\n", + "Train Epoch: 3 [10240/12089 (85%)]\tLoss: 0.723306\n", + "Train Epoch: 3 [10880/12089 (90%)]\tLoss: 0.624521\n", + "Train Epoch: 3 [11520/12089 (95%)]\tLoss: 0.507009\n", + "\n", + "Test set: Average loss: 3.3136\n", + "Class 0 accuracy: 780.0/980(80%)\n", + "Class 1 accuracy: 1067.0/1135(94%)\n", + "Class 2 accuracy: 917.0/1032(89%)\n", + "Class 3 accuracy: 983.0/1010(97%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12089 
(0%)]\tLoss: 0.624655\n", + "Train Epoch: 4 [640/12089 (5%)]\tLoss: 0.452378\n", + "Train Epoch: 4 [1280/12089 (11%)]\tLoss: 0.457449\n", + "Train Epoch: 4 [1920/12089 (16%)]\tLoss: 0.554645\n", + "Train Epoch: 4 [2560/12089 (21%)]\tLoss: 0.621985\n", + "Train Epoch: 4 [3200/12089 (26%)]\tLoss: 0.527864\n", + "Train Epoch: 4 [3840/12089 (32%)]\tLoss: 0.577068\n", + "Train Epoch: 4 [4480/12089 (37%)]\tLoss: 0.514906\n", + "Train Epoch: 4 [5120/12089 (42%)]\tLoss: 0.581334\n", + "Train Epoch: 4 [5760/12089 (48%)]\tLoss: 0.331880\n", + "Train Epoch: 4 [6400/12089 (53%)]\tLoss: 0.424212\n", + "Train Epoch: 4 [7040/12089 (58%)]\tLoss: 0.527507\n", + "Train Epoch: 4 [7680/12089 (63%)]\tLoss: 0.685347\n", + "Train Epoch: 4 [8320/12089 (69%)]\tLoss: 0.525770\n", + "Train Epoch: 4 [8960/12089 (74%)]\tLoss: 0.417910\n", + "Train Epoch: 4 [9600/12089 (79%)]\tLoss: 0.731371\n", + "Train Epoch: 4 [10240/12089 (85%)]\tLoss: 0.528346\n", + "Train Epoch: 4 [10880/12089 (90%)]\tLoss: 0.454048\n", + "Train Epoch: 4 [11520/12089 (95%)]\tLoss: 0.373003\n", + "\n", + "Test set: Average loss: 3.4222\n", + "Class 0 accuracy: 754.0/980(77%)\n", + "Class 1 accuracy: 1055.0/1135(93%)\n", + "Class 2 accuracy: 918.0/1032(89%)\n", + "Class 3 accuracy: 986.0/1010(98%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12089 (0%)]\tLoss: 0.546961\n", + "Train Epoch: 5 [640/12089 (5%)]\tLoss: 0.382696\n", + "Train Epoch: 5 [1280/12089 (11%)]\tLoss: 0.616167\n", + "Train Epoch: 5 [1920/12089 (16%)]\tLoss: 0.551108\n", + "Train Epoch: 5 [2560/12089 (21%)]\tLoss: 0.671682\n", + "Train Epoch: 5 [3200/12089 (26%)]\tLoss: 0.434367\n", + "Train Epoch: 5 [3840/12089 (32%)]\tLoss: 0.589797\n", + "Train Epoch: 5 [4480/12089 (37%)]\tLoss: 0.462255\n", + "Train Epoch: 5 [5120/12089 (42%)]\tLoss: 0.427646\n", + 
"Train Epoch: 5 [5760/12089 (48%)]\tLoss: 0.393138\n", + "Train Epoch: 5 [6400/12089 (53%)]\tLoss: 0.374952\n", + "Train Epoch: 5 [7040/12089 (58%)]\tLoss: 0.392871\n", + "Train Epoch: 5 [7680/12089 (63%)]\tLoss: 0.494981\n", + "Train Epoch: 5 [8320/12089 (69%)]\tLoss: 0.474602\n", + "Train Epoch: 5 [8960/12089 (74%)]\tLoss: 0.418477\n", + "Train Epoch: 5 [9600/12089 (79%)]\tLoss: 0.402891\n", + "Train Epoch: 5 [10240/12089 (85%)]\tLoss: 0.545055\n", + "Train Epoch: 5 [10880/12089 (90%)]\tLoss: 0.465828\n", + "Train Epoch: 5 [11520/12089 (95%)]\tLoss: 0.378968\n", + "\n", + "Test set: Average loss: 3.4964\n", + "Class 0 accuracy: 743.0/980(76%)\n", + "Class 1 accuracy: 1053.0/1135(93%)\n", + "Class 2 accuracy: 928.0/1032(90%)\n", + "Class 3 accuracy: 986.0/1010(98%)\n", + "Class 4 accuracy: 0.0/982(0%)\n", + "Class 5 accuracy: 0.0/892(0%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/11263 (0%)]\tLoss: 0.850781\n", + "Train Epoch: 1 [640/11263 (6%)]\tLoss: 0.798292\n", + "Train Epoch: 1 [1280/11263 (11%)]\tLoss: 0.834117\n", + "Train Epoch: 1 [1920/11263 (17%)]\tLoss: 0.725765\n", + "Train Epoch: 1 [2560/11263 (23%)]\tLoss: 0.676635\n", + "Train Epoch: 1 [3200/11263 (28%)]\tLoss: 0.758110\n", + "Train Epoch: 1 [3840/11263 (34%)]\tLoss: 0.689677\n", + "Train Epoch: 1 [4480/11263 (40%)]\tLoss: 0.686142\n", + "Train Epoch: 1 [5120/11263 (45%)]\tLoss: 0.819930\n", + "Train Epoch: 1 [5760/11263 (51%)]\tLoss: 0.822826\n", + "Train Epoch: 1 [6400/11263 (57%)]\tLoss: 0.597154\n", + "Train Epoch: 1 [7040/11263 (62%)]\tLoss: 0.712456\n", + "Train Epoch: 1 [7680/11263 (68%)]\tLoss: 0.668146\n", + "Train Epoch: 1 [8320/11263 (74%)]\tLoss: 0.641806\n", + "Train Epoch: 1 [8960/11263 (80%)]\tLoss: 0.607866\n", + "Train Epoch: 1 [9600/11263 (85%)]\tLoss: 0.837627\n", + "Train Epoch: 1 [10240/11263 (91%)]\tLoss: 0.767775\n", + "Train Epoch: 1 [10880/11263 
(97%)]\tLoss: 0.710244\n", + "\n", + "Test set: Average loss: 2.3788\n", + "Class 0 accuracy: 936.0/980(96%)\n", + "Class 1 accuracy: 1123.0/1135(99%)\n", + "Class 2 accuracy: 808.0/1032(78%)\n", + "Class 3 accuracy: 926.0/1010(92%)\n", + "Class 4 accuracy: 790.0/982(80%)\n", + "Class 5 accuracy: 360.0/892(40%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/11263 (0%)]\tLoss: 0.896705\n", + "Train Epoch: 2 [640/11263 (6%)]\tLoss: 0.905773\n", + "Train Epoch: 2 [1280/11263 (11%)]\tLoss: 0.899539\n", + "Train Epoch: 2 [1920/11263 (17%)]\tLoss: 0.838611\n", + "Train Epoch: 2 [2560/11263 (23%)]\tLoss: 0.892302\n", + "Train Epoch: 2 [3200/11263 (28%)]\tLoss: 1.038975\n", + "Train Epoch: 2 [3840/11263 (34%)]\tLoss: 0.937163\n", + "Train Epoch: 2 [4480/11263 (40%)]\tLoss: 0.748620\n", + "Train Epoch: 2 [5120/11263 (45%)]\tLoss: 0.863919\n", + "Train Epoch: 2 [5760/11263 (51%)]\tLoss: 1.029196\n", + "Train Epoch: 2 [6400/11263 (57%)]\tLoss: 0.845210\n", + "Train Epoch: 2 [7040/11263 (62%)]\tLoss: 0.758227\n", + "Train Epoch: 2 [7680/11263 (68%)]\tLoss: 0.620243\n", + "Train Epoch: 2 [8320/11263 (74%)]\tLoss: 0.842112\n", + "Train Epoch: 2 [8960/11263 (80%)]\tLoss: 0.743856\n", + "Train Epoch: 2 [9600/11263 (85%)]\tLoss: 0.656504\n", + "Train Epoch: 2 [10240/11263 (91%)]\tLoss: 0.817470\n", + "Train Epoch: 2 [10880/11263 (97%)]\tLoss: 0.658012\n", + "\n", + "Test set: Average loss: 2.4907\n", + "Class 0 accuracy: 789.0/980(81%)\n", + "Class 1 accuracy: 1107.0/1135(98%)\n", + "Class 2 accuracy: 670.0/1032(65%)\n", + "Class 3 accuracy: 515.0/1010(51%)\n", + "Class 4 accuracy: 942.0/982(96%)\n", + "Class 5 accuracy: 766.0/892(86%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/11263 (0%)]\tLoss: 0.754302\n", + "Train Epoch: 3 
[640/11263 (6%)]\tLoss: 0.660190\n", + "Train Epoch: 3 [1280/11263 (11%)]\tLoss: 0.655176\n", + "Train Epoch: 3 [1920/11263 (17%)]\tLoss: 0.696439\n", + "Train Epoch: 3 [2560/11263 (23%)]\tLoss: 0.786622\n", + "Train Epoch: 3 [3200/11263 (28%)]\tLoss: 0.699489\n", + "Train Epoch: 3 [3840/11263 (34%)]\tLoss: 0.776751\n", + "Train Epoch: 3 [4480/11263 (40%)]\tLoss: 0.755700\n", + "Train Epoch: 3 [5120/11263 (45%)]\tLoss: 0.776476\n", + "Train Epoch: 3 [5760/11263 (51%)]\tLoss: 0.718861\n", + "Train Epoch: 3 [6400/11263 (57%)]\tLoss: 0.644046\n", + "Train Epoch: 3 [7040/11263 (62%)]\tLoss: 0.879339\n", + "Train Epoch: 3 [7680/11263 (68%)]\tLoss: 0.587297\n", + "Train Epoch: 3 [8320/11263 (74%)]\tLoss: 0.763207\n", + "Train Epoch: 3 [8960/11263 (80%)]\tLoss: 0.761769\n", + "Train Epoch: 3 [9600/11263 (85%)]\tLoss: 0.656073\n", + "Train Epoch: 3 [10240/11263 (91%)]\tLoss: 0.616851\n", + "Train Epoch: 3 [10880/11263 (97%)]\tLoss: 0.573584\n", + "\n", + "Test set: Average loss: 2.5840\n", + "Class 0 accuracy: 754.0/980(77%)\n", + "Class 1 accuracy: 1089.0/1135(96%)\n", + "Class 2 accuracy: 640.0/1032(62%)\n", + "Class 3 accuracy: 371.0/1010(37%)\n", + "Class 4 accuracy: 960.0/982(98%)\n", + "Class 5 accuracy: 800.0/892(90%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/11263 (0%)]\tLoss: 0.648252\n", + "Train Epoch: 4 [640/11263 (6%)]\tLoss: 0.596721\n", + "Train Epoch: 4 [1280/11263 (11%)]\tLoss: 0.558993\n", + "Train Epoch: 4 [1920/11263 (17%)]\tLoss: 0.492765\n", + "Train Epoch: 4 [2560/11263 (23%)]\tLoss: 0.646996\n", + "Train Epoch: 4 [3200/11263 (28%)]\tLoss: 0.737724\n", + "Train Epoch: 4 [3840/11263 (34%)]\tLoss: 0.578851\n", + "Train Epoch: 4 [4480/11263 (40%)]\tLoss: 0.646620\n", + "Train Epoch: 4 [5120/11263 (45%)]\tLoss: 0.652254\n", + "Train Epoch: 4 [5760/11263 (51%)]\tLoss: 0.631144\n", + "Train Epoch: 4 [6400/11263 (57%)]\tLoss: 
0.702145\n", + "Train Epoch: 4 [7040/11263 (62%)]\tLoss: 0.601468\n", + "Train Epoch: 4 [7680/11263 (68%)]\tLoss: 0.567884\n", + "Train Epoch: 4 [8320/11263 (74%)]\tLoss: 0.487138\n", + "Train Epoch: 4 [8960/11263 (80%)]\tLoss: 0.673586\n", + "Train Epoch: 4 [9600/11263 (85%)]\tLoss: 0.492252\n", + "Train Epoch: 4 [10240/11263 (91%)]\tLoss: 0.645415\n", + "Train Epoch: 4 [10880/11263 (97%)]\tLoss: 0.587828\n", + "\n", + "Test set: Average loss: 2.6582\n", + "Class 0 accuracy: 731.0/980(75%)\n", + "Class 1 accuracy: 1086.0/1135(96%)\n", + "Class 2 accuracy: 631.0/1032(61%)\n", + "Class 3 accuracy: 293.0/1010(29%)\n", + "Class 4 accuracy: 959.0/982(98%)\n", + "Class 5 accuracy: 817.0/892(92%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/11263 (0%)]\tLoss: 0.693316\n", + "Train Epoch: 5 [640/11263 (6%)]\tLoss: 0.579783\n", + "Train Epoch: 5 [1280/11263 (11%)]\tLoss: 0.606642\n", + "Train Epoch: 5 [1920/11263 (17%)]\tLoss: 0.578930\n", + "Train Epoch: 5 [2560/11263 (23%)]\tLoss: 0.593126\n", + "Train Epoch: 5 [3200/11263 (28%)]\tLoss: 0.568712\n", + "Train Epoch: 5 [3840/11263 (34%)]\tLoss: 0.730927\n", + "Train Epoch: 5 [4480/11263 (40%)]\tLoss: 0.517850\n", + "Train Epoch: 5 [5120/11263 (45%)]\tLoss: 0.595436\n", + "Train Epoch: 5 [5760/11263 (51%)]\tLoss: 0.623922\n", + "Train Epoch: 5 [6400/11263 (57%)]\tLoss: 0.477650\n", + "Train Epoch: 5 [7040/11263 (62%)]\tLoss: 0.672610\n", + "Train Epoch: 5 [7680/11263 (68%)]\tLoss: 0.543774\n", + "Train Epoch: 5 [8320/11263 (74%)]\tLoss: 0.580296\n", + "Train Epoch: 5 [8960/11263 (80%)]\tLoss: 0.583141\n", + "Train Epoch: 5 [9600/11263 (85%)]\tLoss: 0.448098\n", + "Train Epoch: 5 [10240/11263 (91%)]\tLoss: 0.625687\n", + "Train Epoch: 5 [10880/11263 (97%)]\tLoss: 0.533021\n", + "\n", + "Test set: Average loss: 2.7075\n", + "Class 0 accuracy: 719.0/980(73%)\n", + "Class 1 accuracy: 
1080.0/1135(95%)\n", + "Class 2 accuracy: 629.0/1032(61%)\n", + "Class 3 accuracy: 287.0/1010(28%)\n", + "Class 4 accuracy: 959.0/982(98%)\n", + "Class 5 accuracy: 834.0/892(93%)\n", + "Class 6 accuracy: 0.0/958(0%)\n", + "Class 7 accuracy: 0.0/1028(0%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/12183 (0%)]\tLoss: 0.851070\n", + "Train Epoch: 1 [640/12183 (5%)]\tLoss: 0.703527\n", + "Train Epoch: 1 [1280/12183 (10%)]\tLoss: 0.862511\n", + "Train Epoch: 1 [1920/12183 (16%)]\tLoss: 0.664779\n", + "Train Epoch: 1 [2560/12183 (21%)]\tLoss: 0.622195\n", + "Train Epoch: 1 [3200/12183 (26%)]\tLoss: 0.686788\n", + "Train Epoch: 1 [3840/12183 (31%)]\tLoss: 0.766821\n", + "Train Epoch: 1 [4480/12183 (37%)]\tLoss: 0.635133\n", + "Train Epoch: 1 [5120/12183 (42%)]\tLoss: 0.673985\n", + "Train Epoch: 1 [5760/12183 (47%)]\tLoss: 0.736285\n", + "Train Epoch: 1 [6400/12183 (52%)]\tLoss: 0.763070\n", + "Train Epoch: 1 [7040/12183 (58%)]\tLoss: 0.914076\n", + "Train Epoch: 1 [7680/12183 (63%)]\tLoss: 0.897798\n", + "Train Epoch: 1 [8320/12183 (68%)]\tLoss: 0.769690\n", + "Train Epoch: 1 [8960/12183 (73%)]\tLoss: 0.705697\n", + "Train Epoch: 1 [9600/12183 (79%)]\tLoss: 0.890666\n", + "Train Epoch: 1 [10240/12183 (84%)]\tLoss: 0.964875\n", + "Train Epoch: 1 [10880/12183 (89%)]\tLoss: 0.846083\n", + "Train Epoch: 1 [11520/12183 (94%)]\tLoss: 0.977361\n", + "Train Epoch: 1 [4370/12183 (99%)]\tLoss: 1.044579\n", + "\n", + "Test set: Average loss: 1.6683\n", + "Class 0 accuracy: 839.0/980(86%)\n", + "Class 1 accuracy: 1086.0/1135(96%)\n", + "Class 2 accuracy: 547.0/1032(53%)\n", + "Class 3 accuracy: 854.0/1010(85%)\n", + "Class 4 accuracy: 673.0/982(69%)\n", + "Class 5 accuracy: 311.0/892(35%)\n", + "Class 6 accuracy: 878.0/958(92%)\n", + "Class 7 accuracy: 904.0/1028(88%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 2 [0/12183 (0%)]\tLoss: 0.782327\n", + "Train Epoch: 2 [640/12183 
(5%)]\tLoss: 0.875331\n", + "Train Epoch: 2 [1280/12183 (10%)]\tLoss: 0.926851\n", + "Train Epoch: 2 [1920/12183 (16%)]\tLoss: 0.874468\n", + "Train Epoch: 2 [2560/12183 (21%)]\tLoss: 0.925109\n", + "Train Epoch: 2 [3200/12183 (26%)]\tLoss: 0.954436\n", + "Train Epoch: 2 [3840/12183 (31%)]\tLoss: 0.942288\n", + "Train Epoch: 2 [4480/12183 (37%)]\tLoss: 0.940796\n", + "Train Epoch: 2 [5120/12183 (42%)]\tLoss: 0.857594\n", + "Train Epoch: 2 [5760/12183 (47%)]\tLoss: 1.031697\n", + "Train Epoch: 2 [6400/12183 (52%)]\tLoss: 0.929081\n", + "Train Epoch: 2 [7040/12183 (58%)]\tLoss: 0.983720\n", + "Train Epoch: 2 [7680/12183 (63%)]\tLoss: 0.876552\n", + "Train Epoch: 2 [8320/12183 (68%)]\tLoss: 0.934435\n", + "Train Epoch: 2 [8960/12183 (73%)]\tLoss: 1.003677\n", + "Train Epoch: 2 [9600/12183 (79%)]\tLoss: 0.931277\n", + "Train Epoch: 2 [10240/12183 (84%)]\tLoss: 1.008535\n", + "Train Epoch: 2 [10880/12183 (89%)]\tLoss: 0.810847\n", + "Train Epoch: 2 [11520/12183 (94%)]\tLoss: 0.702577\n", + "Train Epoch: 2 [4370/12183 (99%)]\tLoss: 0.964019\n", + "\n", + "Test set: Average loss: 1.6425\n", + "Class 0 accuracy: 804.0/980(82%)\n", + "Class 1 accuracy: 1065.0/1135(94%)\n", + "Class 2 accuracy: 527.0/1032(51%)\n", + "Class 3 accuracy: 774.0/1010(77%)\n", + "Class 4 accuracy: 629.0/982(64%)\n", + "Class 5 accuracy: 347.0/892(39%)\n", + "Class 6 accuracy: 931.0/958(97%)\n", + "Class 7 accuracy: 983.0/1028(96%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 3 [0/12183 (0%)]\tLoss: 0.658189\n", + "Train Epoch: 3 [640/12183 (5%)]\tLoss: 0.624558\n", + "Train Epoch: 3 [1280/12183 (10%)]\tLoss: 0.811082\n", + "Train Epoch: 3 [1920/12183 (16%)]\tLoss: 0.653154\n", + "Train Epoch: 3 [2560/12183 (21%)]\tLoss: 0.784420\n", + "Train Epoch: 3 [3200/12183 (26%)]\tLoss: 0.620821\n", + "Train Epoch: 3 [3840/12183 (31%)]\tLoss: 0.743391\n", + "Train Epoch: 3 [4480/12183 (37%)]\tLoss: 0.694466\n", + "Train Epoch: 3 [5120/12183 (42%)]\tLoss: 
0.580736\n", + "Train Epoch: 3 [5760/12183 (47%)]\tLoss: 0.673027\n", + "Train Epoch: 3 [6400/12183 (52%)]\tLoss: 0.545014\n", + "Train Epoch: 3 [7040/12183 (58%)]\tLoss: 0.924152\n", + "Train Epoch: 3 [7680/12183 (63%)]\tLoss: 0.730344\n", + "Train Epoch: 3 [8320/12183 (68%)]\tLoss: 0.724853\n", + "Train Epoch: 3 [8960/12183 (73%)]\tLoss: 0.699868\n", + "Train Epoch: 3 [9600/12183 (79%)]\tLoss: 0.697215\n", + "Train Epoch: 3 [10240/12183 (84%)]\tLoss: 0.783108\n", + "Train Epoch: 3 [10880/12183 (89%)]\tLoss: 0.672869\n", + "Train Epoch: 3 [11520/12183 (94%)]\tLoss: 0.625879\n", + "Train Epoch: 3 [4370/12183 (99%)]\tLoss: 0.598810\n", + "\n", + "Test set: Average loss: 1.6302\n", + "Class 0 accuracy: 797.0/980(81%)\n", + "Class 1 accuracy: 1062.0/1135(94%)\n", + "Class 2 accuracy: 526.0/1032(51%)\n", + "Class 3 accuracy: 762.0/1010(75%)\n", + "Class 4 accuracy: 657.0/982(67%)\n", + "Class 5 accuracy: 415.0/892(47%)\n", + "Class 6 accuracy: 938.0/958(98%)\n", + "Class 7 accuracy: 992.0/1028(96%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 4 [0/12183 (0%)]\tLoss: 0.686760\n", + "Train Epoch: 4 [640/12183 (5%)]\tLoss: 0.678613\n", + "Train Epoch: 4 [1280/12183 (10%)]\tLoss: 0.649789\n", + "Train Epoch: 4 [1920/12183 (16%)]\tLoss: 0.512429\n", + "Train Epoch: 4 [2560/12183 (21%)]\tLoss: 0.689496\n", + "Train Epoch: 4 [3200/12183 (26%)]\tLoss: 0.608655\n", + "Train Epoch: 4 [3840/12183 (31%)]\tLoss: 0.553349\n", + "Train Epoch: 4 [4480/12183 (37%)]\tLoss: 0.538118\n", + "Train Epoch: 4 [5120/12183 (42%)]\tLoss: 0.461560\n", + "Train Epoch: 4 [5760/12183 (47%)]\tLoss: 0.588525\n", + "Train Epoch: 4 [6400/12183 (52%)]\tLoss: 0.508286\n", + "Train Epoch: 4 [7040/12183 (58%)]\tLoss: 0.540536\n", + "Train Epoch: 4 [7680/12183 (63%)]\tLoss: 0.479708\n", + "Train Epoch: 4 [8320/12183 (68%)]\tLoss: 0.501095\n", + "Train Epoch: 4 [8960/12183 (73%)]\tLoss: 0.469510\n", + "Train Epoch: 4 [9600/12183 (79%)]\tLoss: 0.497756\n", + 
"Train Epoch: 4 [10240/12183 (84%)]\tLoss: 0.523196\n", + "Train Epoch: 4 [10880/12183 (89%)]\tLoss: 0.555491\n", + "Train Epoch: 4 [11520/12183 (94%)]\tLoss: 0.515540\n", + "Train Epoch: 4 [4370/12183 (99%)]\tLoss: 0.572875\n", + "\n", + "Test set: Average loss: 1.6347\n", + "Class 0 accuracy: 788.0/980(80%)\n", + "Class 1 accuracy: 1063.0/1135(94%)\n", + "Class 2 accuracy: 534.0/1032(52%)\n", + "Class 3 accuracy: 769.0/1010(76%)\n", + "Class 4 accuracy: 672.0/982(68%)\n", + "Class 5 accuracy: 440.0/892(49%)\n", + "Class 6 accuracy: 940.0/958(98%)\n", + "Class 7 accuracy: 996.0/1028(97%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 5 [0/12183 (0%)]\tLoss: 0.595143\n", + "Train Epoch: 5 [640/12183 (5%)]\tLoss: 0.550319\n", + "Train Epoch: 5 [1280/12183 (10%)]\tLoss: 0.548414\n", + "Train Epoch: 5 [1920/12183 (16%)]\tLoss: 0.511655\n", + "Train Epoch: 5 [2560/12183 (21%)]\tLoss: 0.401490\n", + "Train Epoch: 5 [3200/12183 (26%)]\tLoss: 0.400202\n", + "Train Epoch: 5 [3840/12183 (31%)]\tLoss: 0.397857\n", + "Train Epoch: 5 [4480/12183 (37%)]\tLoss: 0.479915\n", + "Train Epoch: 5 [5120/12183 (42%)]\tLoss: 0.408378\n", + "Train Epoch: 5 [5760/12183 (47%)]\tLoss: 0.431881\n", + "Train Epoch: 5 [6400/12183 (52%)]\tLoss: 0.429216\n", + "Train Epoch: 5 [7040/12183 (58%)]\tLoss: 0.347318\n", + "Train Epoch: 5 [7680/12183 (63%)]\tLoss: 0.549904\n", + "Train Epoch: 5 [8320/12183 (68%)]\tLoss: 0.484814\n", + "Train Epoch: 5 [8960/12183 (73%)]\tLoss: 0.430466\n", + "Train Epoch: 5 [9600/12183 (79%)]\tLoss: 0.517198\n", + "Train Epoch: 5 [10240/12183 (84%)]\tLoss: 0.395947\n", + "Train Epoch: 5 [10880/12183 (89%)]\tLoss: 0.551409\n", + "Train Epoch: 5 [11520/12183 (94%)]\tLoss: 0.495534\n", + "Train Epoch: 5 [4370/12183 (99%)]\tLoss: 0.495679\n", + "\n", + "Test set: Average loss: 1.6534\n", + "Class 0 accuracy: 781.0/980(80%)\n", + "Class 1 accuracy: 1059.0/1135(93%)\n", + "Class 2 accuracy: 530.0/1032(51%)\n", + "Class 3 
accuracy: 763.0/1010(76%)\n", + "Class 4 accuracy: 672.0/982(68%)\n", + "Class 5 accuracy: 444.0/892(50%)\n", + "Class 6 accuracy: 940.0/958(98%)\n", + "Class 7 accuracy: 1001.0/1028(97%)\n", + "Class 8 accuracy: 0.0/974(0%)\n", + "Class 9 accuracy: 0.0/1009(0%)\n", + "Train Epoch: 1 [0/11800 (0%)]\tLoss: 0.848253\n", + "Train Epoch: 1 [640/11800 (5%)]\tLoss: 0.637744\n", + "Train Epoch: 1 [1280/11800 (11%)]\tLoss: 0.628570\n", + "Train Epoch: 1 [1920/11800 (16%)]\tLoss: 0.461403\n", + "Train Epoch: 1 [2560/11800 (22%)]\tLoss: 0.513085\n", + "Train Epoch: 1 [3200/11800 (27%)]\tLoss: 0.590126\n", + "Train Epoch: 1 [3840/11800 (32%)]\tLoss: 0.472829\n", + "Train Epoch: 1 [4480/11800 (38%)]\tLoss: 0.592700\n", + "Train Epoch: 1 [5120/11800 (43%)]\tLoss: 0.617516\n", + "Train Epoch: 1 [5760/11800 (49%)]\tLoss: 0.555048\n", + "Train Epoch: 1 [6400/11800 (54%)]\tLoss: 0.743809\n", + "Train Epoch: 1 [7040/11800 (59%)]\tLoss: 0.765445\n", + "Train Epoch: 1 [7680/11800 (65%)]\tLoss: 0.768416\n", + "Train Epoch: 1 [8320/11800 (70%)]\tLoss: 0.777279\n", + "Train Epoch: 1 [8960/11800 (76%)]\tLoss: 0.842107\n", + "Train Epoch: 1 [9600/11800 (81%)]\tLoss: 0.796940\n", + "Train Epoch: 1 [10240/11800 (86%)]\tLoss: 0.601572\n", + "Train Epoch: 1 [10880/11800 (92%)]\tLoss: 0.841399\n", + "Train Epoch: 1 [11520/11800 (97%)]\tLoss: 0.846165\n", + "\n", + "Test set: Average loss: 0.9925\n", + "Class 0 accuracy: 835.0/980(85%)\n", + "Class 1 accuracy: 1050.0/1135(93%)\n", + "Class 2 accuracy: 638.0/1032(62%)\n", + "Class 3 accuracy: 738.0/1010(73%)\n", + "Class 4 accuracy: 548.0/982(56%)\n", + "Class 5 accuracy: 170.0/892(19%)\n", + "Class 6 accuracy: 779.0/958(81%)\n", + "Class 7 accuracy: 776.0/1028(75%)\n", + "Class 8 accuracy: 908.0/974(93%)\n", + "Class 9 accuracy: 801.0/1009(79%)\n", + "Train Epoch: 2 [0/11800 (0%)]\tLoss: 0.883257\n", + "Train Epoch: 2 [640/11800 (5%)]\tLoss: 0.857211\n", + "Train Epoch: 2 [1280/11800 (11%)]\tLoss: 0.841614\n", + "Train Epoch: 2 [1920/11800 
(16%)]\tLoss: 0.790240\n", + "Train Epoch: 2 [2560/11800 (22%)]\tLoss: 0.950122\n", + "Train Epoch: 2 [3200/11800 (27%)]\tLoss: 0.835133\n", + "Train Epoch: 2 [3840/11800 (32%)]\tLoss: 0.882796\n", + "Train Epoch: 2 [4480/11800 (38%)]\tLoss: 0.810285\n", + "Train Epoch: 2 [5120/11800 (43%)]\tLoss: 0.799711\n", + "Train Epoch: 2 [5760/11800 (49%)]\tLoss: 0.834429\n", + "Train Epoch: 2 [6400/11800 (54%)]\tLoss: 0.839871\n", + "Train Epoch: 2 [7040/11800 (59%)]\tLoss: 0.947290\n", + "Train Epoch: 2 [7680/11800 (65%)]\tLoss: 0.710232\n", + "Train Epoch: 2 [8320/11800 (70%)]\tLoss: 0.779843\n", + "Train Epoch: 2 [8960/11800 (76%)]\tLoss: 0.733478\n", + "Train Epoch: 2 [9600/11800 (81%)]\tLoss: 0.938040\n", + "Train Epoch: 2 [10240/11800 (86%)]\tLoss: 0.839119\n", + "Train Epoch: 2 [10880/11800 (92%)]\tLoss: 0.696384\n", + "Train Epoch: 2 [11520/11800 (97%)]\tLoss: 0.752226\n", + "\n", + "Test set: Average loss: 0.9674\n", + "Class 0 accuracy: 825.0/980(84%)\n", + "Class 1 accuracy: 1004.0/1135(88%)\n", + "Class 2 accuracy: 599.0/1032(58%)\n", + "Class 3 accuracy: 615.0/1010(61%)\n", + "Class 4 accuracy: 332.0/982(34%)\n", + "Class 5 accuracy: 42.0/892(5%)\n", + "Class 6 accuracy: 762.0/958(80%)\n", + "Class 7 accuracy: 623.0/1028(61%)\n", + "Class 8 accuracy: 943.0/974(97%)\n", + "Class 9 accuracy: 923.0/1009(91%)\n", + "Train Epoch: 3 [0/11800 (0%)]\tLoss: 0.708711\n", + "Train Epoch: 3 [640/11800 (5%)]\tLoss: 0.783265\n", + "Train Epoch: 3 [1280/11800 (11%)]\tLoss: 0.810831\n", + "Train Epoch: 3 [1920/11800 (16%)]\tLoss: 0.753713\n", + "Train Epoch: 3 [2560/11800 (22%)]\tLoss: 0.696868\n", + "Train Epoch: 3 [3200/11800 (27%)]\tLoss: 0.572866\n", + "Train Epoch: 3 [3840/11800 (32%)]\tLoss: 0.757275\n", + "Train Epoch: 3 [4480/11800 (38%)]\tLoss: 0.732344\n", + "Train Epoch: 3 [5120/11800 (43%)]\tLoss: 0.671541\n", + "Train Epoch: 3 [5760/11800 (49%)]\tLoss: 0.724425\n", + "Train Epoch: 3 [6400/11800 (54%)]\tLoss: 0.719062\n", + "Train Epoch: 3 [7040/11800 (59%)]\tLoss: 
0.712015\n", + "Train Epoch: 3 [7680/11800 (65%)]\tLoss: 0.619695\n", + "Train Epoch: 3 [8320/11800 (70%)]\tLoss: 0.781576\n", + "Train Epoch: 3 [8960/11800 (76%)]\tLoss: 0.707311\n", + "Train Epoch: 3 [9600/11800 (81%)]\tLoss: 0.700315\n", + "Train Epoch: 3 [10240/11800 (86%)]\tLoss: 0.579610\n", + "Train Epoch: 3 [10880/11800 (92%)]\tLoss: 0.836607\n", + "Train Epoch: 3 [11520/11800 (97%)]\tLoss: 0.599106\n", + "\n", + "Test set: Average loss: 0.9365\n", + "Class 0 accuracy: 817.0/980(83%)\n", + "Class 1 accuracy: 996.0/1135(88%)\n", + "Class 2 accuracy: 598.0/1032(58%)\n", + "Class 3 accuracy: 612.0/1010(61%)\n", + "Class 4 accuracy: 291.0/982(30%)\n", + "Class 5 accuracy: 58.0/892(7%)\n", + "Class 6 accuracy: 772.0/958(81%)\n", + "Class 7 accuracy: 574.0/1028(56%)\n", + "Class 8 accuracy: 941.0/974(97%)\n", + "Class 9 accuracy: 948.0/1009(94%)\n", + "Train Epoch: 4 [0/11800 (0%)]\tLoss: 0.764324\n", + "Train Epoch: 4 [640/11800 (5%)]\tLoss: 0.750924\n", + "Train Epoch: 4 [1280/11800 (11%)]\tLoss: 0.597976\n", + "Train Epoch: 4 [1920/11800 (16%)]\tLoss: 0.711546\n", + "Train Epoch: 4 [2560/11800 (22%)]\tLoss: 0.744140\n", + "Train Epoch: 4 [3200/11800 (27%)]\tLoss: 0.756678\n", + "Train Epoch: 4 [3840/11800 (32%)]\tLoss: 0.566600\n", + "Train Epoch: 4 [4480/11800 (38%)]\tLoss: 0.728696\n", + "Train Epoch: 4 [5120/11800 (43%)]\tLoss: 0.720701\n", + "Train Epoch: 4 [5760/11800 (49%)]\tLoss: 0.566305\n", + "Train Epoch: 4 [6400/11800 (54%)]\tLoss: 0.689037\n", + "Train Epoch: 4 [7040/11800 (59%)]\tLoss: 0.678461\n", + "Train Epoch: 4 [7680/11800 (65%)]\tLoss: 0.550391\n", + "Train Epoch: 4 [8320/11800 (70%)]\tLoss: 0.694139\n", + "Train Epoch: 4 [8960/11800 (76%)]\tLoss: 0.700623\n", + "Train Epoch: 4 [9600/11800 (81%)]\tLoss: 0.623185\n", + "Train Epoch: 4 [10240/11800 (86%)]\tLoss: 0.696449\n", + "Train Epoch: 4 [10880/11800 (92%)]\tLoss: 0.732011\n", + "Train Epoch: 4 [11520/11800 (97%)]\tLoss: 0.734793\n", + "\n", + "Test set: Average loss: 0.9336\n", + "Class 
0 accuracy: 809.0/980(83%)\n", + "Class 1 accuracy: 986.0/1135(87%)\n", + "Class 2 accuracy: 593.0/1032(57%)\n", + "Class 3 accuracy: 575.0/1010(57%)\n", + "Class 4 accuracy: 283.0/982(29%)\n", + "Class 5 accuracy: 60.0/892(7%)\n", + "Class 6 accuracy: 772.0/958(81%)\n", + "Class 7 accuracy: 550.0/1028(54%)\n", + "Class 8 accuracy: 943.0/974(97%)\n", + "Class 9 accuracy: 956.0/1009(95%)\n", + "Train Epoch: 5 [0/11800 (0%)]\tLoss: 0.598379\n", + "Train Epoch: 5 [640/11800 (5%)]\tLoss: 0.805639\n", + "Train Epoch: 5 [1280/11800 (11%)]\tLoss: 0.687005\n", + "Train Epoch: 5 [1920/11800 (16%)]\tLoss: 0.553637\n", + "Train Epoch: 5 [2560/11800 (22%)]\tLoss: 0.630970\n", + "Train Epoch: 5 [3200/11800 (27%)]\tLoss: 0.618934\n", + "Train Epoch: 5 [3840/11800 (32%)]\tLoss: 0.695465\n", + "Train Epoch: 5 [4480/11800 (38%)]\tLoss: 0.617699\n", + "Train Epoch: 5 [5120/11800 (43%)]\tLoss: 0.745449\n", + "Train Epoch: 5 [5760/11800 (49%)]\tLoss: 0.529404\n", + "Train Epoch: 5 [6400/11800 (54%)]\tLoss: 0.633640\n", + "Train Epoch: 5 [7040/11800 (59%)]\tLoss: 0.788254\n", + "Train Epoch: 5 [7680/11800 (65%)]\tLoss: 0.565721\n", + "Train Epoch: 5 [8320/11800 (70%)]\tLoss: 0.707190\n", + "Train Epoch: 5 [8960/11800 (76%)]\tLoss: 0.583630\n", + "Train Epoch: 5 [9600/11800 (81%)]\tLoss: 0.549434\n", + "Train Epoch: 5 [10240/11800 (86%)]\tLoss: 0.546574\n", + "Train Epoch: 5 [10880/11800 (92%)]\tLoss: 0.536187\n", + "Train Epoch: 5 [11520/11800 (97%)]\tLoss: 0.731755\n", + "\n", + "Test set: Average loss: 0.9307\n", + "Class 0 accuracy: 807.0/980(82%)\n", + "Class 1 accuracy: 977.0/1135(86%)\n", + "Class 2 accuracy: 588.0/1032(57%)\n", + "Class 3 accuracy: 548.0/1010(54%)\n", + "Class 4 accuracy: 283.0/982(29%)\n", + "Class 5 accuracy: 70.0/892(8%)\n", + "Class 6 accuracy: 772.0/958(81%)\n", + "Class 7 accuracy: 546.0/1028(53%)\n", + "Class 8 accuracy: 945.0/974(97%)\n", + "Class 9 accuracy: 958.0/1009(95%)\n", + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 0.606930\n", + "Train Epoch: 1 
[640/12665 (5%)]\tLoss: 0.566195\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 0.488845\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 0.440726\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 0.412488\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 0.525131\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 0.394614\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 0.449948\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 0.455428\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 0.374721\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 0.441609\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 0.499441\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.482373\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.431031\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.455554\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.415438\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.355638\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.477118\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.512437\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.351764\n", + "\n", + "Test set: Average loss: 0.8019\n", + "Class 0 accuracy: 968.0/980(99%)\n", + "Class 1 accuracy: 1130.0/1135(100%)\n", + "Class 2 accuracy: 604.0/1032(59%)\n", + "Class 3 accuracy: 753.0/1010(75%)\n", + "Class 4 accuracy: 673.0/982(69%)\n", + "Class 5 accuracy: 496.0/892(56%)\n", + "Class 6 accuracy: 695.0/958(73%)\n", + "Class 7 accuracy: 825.0/1028(80%)\n", + "Class 8 accuracy: 589.0/974(60%)\n", + "Class 9 accuracy: 751.0/1009(74%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.382221\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.359024\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.443718\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.352842\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.390380\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.450553\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.285430\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.317991\n", + "Train Epoch: 2 [5120/12665 
(40%)]\tLoss: 0.304995\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.402834\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.410913\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.323035\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.359033\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.332048\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.344597\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.363583\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.267385\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.303813\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.394272\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.275770\n", + "\n", + "Test set: Average loss: 0.7998\n", + "Class 0 accuracy: 970.0/980(99%)\n", + "Class 1 accuracy: 1130.0/1135(100%)\n", + "Class 2 accuracy: 586.0/1032(57%)\n", + "Class 3 accuracy: 743.0/1010(74%)\n", + "Class 4 accuracy: 675.0/982(69%)\n", + "Class 5 accuracy: 498.0/892(56%)\n", + "Class 6 accuracy: 686.0/958(72%)\n", + "Class 7 accuracy: 819.0/1028(80%)\n", + "Class 8 accuracy: 607.0/974(62%)\n", + "Class 9 accuracy: 756.0/1009(75%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.361247\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.295900\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.298250\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.288731\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.304051\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.301107\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.264046\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.236352\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.251096\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.369783\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.356867\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.247389\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.264304\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.243768\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.328787\n", + "Train Epoch: 3 [9600/12665 
(76%)]\tLoss: 0.294538\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.300040\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.258787\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.283641\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.338280\n", + "\n", + "Test set: Average loss: 0.7930\n", + "Class 0 accuracy: 971.0/980(99%)\n", + "Class 1 accuracy: 1130.0/1135(100%)\n", + "Class 2 accuracy: 589.0/1032(57%)\n", + "Class 3 accuracy: 741.0/1010(73%)\n", + "Class 4 accuracy: 671.0/982(68%)\n", + "Class 5 accuracy: 516.0/892(58%)\n", + "Class 6 accuracy: 685.0/958(72%)\n", + "Class 7 accuracy: 813.0/1028(79%)\n", + "Class 8 accuracy: 608.0/974(62%)\n", + "Class 9 accuracy: 755.0/1009(75%)\n", + "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.236698\n", + "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.221445\n", + "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.236138\n", + "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.257844\n", + "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.233735\n", + "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.222089\n", + "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.307528\n", + "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.285662\n", + "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.240001\n", + "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.292137\n", + "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.290430\n", + "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.299295\n", + "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.255210\n", + "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.203961\n", + "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.238729\n", + "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.249784\n", + "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.193929\n", + "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.198174\n", + "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.270540\n", + "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.217733\n", + "\n", + "Test set: Average loss: 0.8017\n", + "Class 0 accuracy: 971.0/980(99%)\n", + "Class 1 accuracy: 1130.0/1135(100%)\n", + "Class 2 accuracy: 
575.0/1032(56%)\n", + "Class 3 accuracy: 736.0/1010(73%)\n", + "Class 4 accuracy: 671.0/982(68%)\n", + "Class 5 accuracy: 511.0/892(57%)\n", + "Class 6 accuracy: 682.0/958(71%)\n", + "Class 7 accuracy: 814.0/1028(79%)\n", + "Class 8 accuracy: 607.0/974(62%)\n", + "Class 9 accuracy: 750.0/1009(74%)\n", + "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.226164\n", + "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.318618\n", + "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.238432\n", + "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.262093\n", + "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.286501\n", + "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.219213\n", + "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.250186\n", + "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.270830\n", + "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.149153\n", + "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.206908\n", + "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.237038\n", + "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.289587\n", + "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.243903\n", + "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.234777\n", + "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.194367\n", + "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.248726\n", + "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.233232\n", + "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.258024\n", + "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.280726\n", + "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.206879\n", + "\n", + "Test set: Average loss: 0.8039\n", + "Class 0 accuracy: 971.0/980(99%)\n", + "Class 1 accuracy: 1130.0/1135(100%)\n", + "Class 2 accuracy: 575.0/1032(56%)\n", + "Class 3 accuracy: 739.0/1010(73%)\n", + "Class 4 accuracy: 672.0/982(68%)\n", + "Class 5 accuracy: 520.0/892(58%)\n", + "Class 6 accuracy: 676.0/958(71%)\n", + "Class 7 accuracy: 812.0/1028(79%)\n", + "Class 8 accuracy: 597.0/974(61%)\n", + "Class 9 accuracy: 746.0/1009(74%)\n" + ] + } + ] + }, + { + "cell_type": "markdown", + "metadata": { + "id": "8Yad6wstNUpx" + }, + "source": [ 
+ "# Analysis of the results" + ] + }, + { + "cell_type": "code", + "execution_count": 18, + "metadata": { + "id": "gimHfUXdW4_K" + }, + "outputs": [], + "source": [ + "# The following helper code takes the logs and converts them into a dataframe\n", + "# for easier reading. You can also store the result as a CSV or HDF file by\n", + "# using the .to_csv and .to_hdf methods from pandas for later reading.\n", + "\n", + "import matplotlib.pyplot as plt\n", + "import pandas as pd\n", + "\n", + "def format_results(history):\n", + " logs = pd.DataFrame(history).round(2)\n", + " logs.index.name = 'epoch'\n", + " logs = logs.reset_index(drop = False)\n", + " return logs\n", + "\n", + "#display(format_results(history_regular_mnist).head())\n", + "#display(format_results(history_catastrophic_forgetting).head())\n", + "#display(format_results(history_memory_replay).head())" + ] + }, + { + "cell_type": "code", + "execution_count": null, + "metadata": { + "id": "jR6eRKn4WguU" + }, + "outputs": [], + "source": [ + "# Finally, we plot the results and optionally compare the three different training setups.\n", + "# Try to adapt and extend the plotting function to the needs of your experimental setup.\n", + "\n", + "import matplotlib.pyplot as plt\n", + "import seaborn as sns\n", + "\n", + "fig, axes = plt.subplots(10, 2,figsize = (5, 7), sharex = True)\n", + "\n", + "# Iterate over the different training setups for comparison\n", + "for log_id, logs in enumerate([history_catastrophic_forgetting, history_memory_replay]):\n", + " # Format the logs into a dataframe\n", + " logs = format_results(logs)\n", + " # Iterate through the 10 different MNIST classes (0...9). 
We will plot one subpanel\n", + " # for each of them, showing the accuracies for that particular class over the course\n", + " # of the entire training.\n", + " for class_ in range(10):\n", + " # Get the correct subpanel of the plot\n", + " ax = axes[class_, log_id]\n", + " \n", + " # Draw a line plot: The x axis will be the epoch, the y axis will be the accuarcy\n", + " # for predicting a particular class.\n", + " ax.plot(logs.epoch, logs[class_], color = 'black')\n", + " \n", + " # Finally, we will optimize the plot a bit and remove unneeded lines\n", + " ax.set_ylim([0, 1])\n", + " sns.despine(bottom = True, trim = True)\n", + "\n", + "axes[-1].set_xlabel(\"Epochs\")\n", + "plt.show()" + ] + }, + { + "cell_type": "markdown", + "source": [ + "Here are some example outputs:\n", + "\n", + "| With catastrophic forgetting | Training setup using a regularizer |\n", + "|-|-|\n", + "|![image.png]() |![image.png]() |" + ], + "metadata": { + "id": "5RolXP_mTxwp" + } + } + ], + "metadata": { + "accelerator": "GPU", + "colab": { + "gpuType": "T4", + "provenance": [] + }, + "gpuClass": "standard", + "kernelspec": { + "display_name": "Python 3 (ipykernel)", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.3" + } + }, + "nbformat": 4, + "nbformat_minor": 0 +} \ No newline at end of file From 950fa9eb836f89568f77b0283d6848741916b9fb Mon Sep 17 00:00:00 2001 From: Steffen Schneider Date: Wed, 24 May 2023 03:31:26 +0200 Subject: [PATCH 2/2] Generate a better result plot --- week11/week11.ipynb | 4246 ++++++++++++++++++++----------------------- 1 file changed, 1935 insertions(+), 2311 deletions(-) diff --git a/week11/week11.ipynb b/week11/week11.ipynb index aa4630d..5b175ec 100644 --- a/week11/week11.ipynb +++ b/week11/week11.ipynb @@ 
-24,7 +24,7 @@ }, { "cell_type": "code", - "execution_count": 2, + "execution_count": 1, "metadata": { "id": "MN_GMVuyPD9D" }, @@ -76,7 +76,7 @@ }, { "cell_type": "code", - "execution_count": 3, + "execution_count": 2, "metadata": { "id": "Bu5GtxDyPMW5" }, @@ -114,7 +114,7 @@ }, { "cell_type": "code", - "execution_count": 6, + "execution_count": 3, "metadata": { "id": "FljvS0QcPPTg" }, @@ -173,7 +173,7 @@ }, { "cell_type": "code", - "execution_count": 7, + "execution_count": 4, "metadata": { "id": "QXPgWNCRPRd4" }, @@ -222,7 +222,7 @@ }, { "cell_type": "code", - "execution_count": 9, + "execution_count": 5, "metadata": { "id": "UsdJlkLkRRbp" }, @@ -279,7 +279,7 @@ }, { "cell_type": "code", - "execution_count": 10, + "execution_count": 6, "metadata": { "id": "EDwtthksNUpw" }, @@ -325,7 +325,7 @@ }, { "cell_type": "code", - "execution_count": 12, + "execution_count": 7, "metadata": { "id": "u2xvlBoZPTyx" }, @@ -418,8 +418,8 @@ "config = argparse.Namespace(\n", " batch_size=64, \n", " test_batch_size=1000, \n", - " epochs=5, \n", - " lr=0.001,\n", + " epochs=3, \n", + " lr=0.01,\n", " gamma=0.7,\n", " no_cuda=False,\n", " dry_run=False,\n", @@ -436,619 +436,15 @@ " train_model(config, model, phase = \"baseline\", history = history)\n", " return history\n", "\n", - "history_regular_mnist = train_regular_mnist()\n", - "history_regular_mnist" + "# Uncomment to train\n", + "#history_regular_mnist = train_regular_mnist()\n", + "#history_regular_mnist" ], "metadata": { - "colab": { - "base_uri": "https://localhost:8080/" - }, - "id": "SK-GNifLPN2S", - "outputId": "9cd9a6a2-9b54-46c8-a072-fcd66b995364" + "id": "SK-GNifLPN2S" }, - "execution_count": 14, - "outputs": [ - { - "output_type": "stream", - "name": "stdout", - "text": [ - "Train Epoch: 1 [0/60000 (0%)]\tLoss: 2.295775\n", - "Train Epoch: 1 [640/60000 (1%)]\tLoss: 2.290210\n", - "Train Epoch: 1 [1280/60000 (2%)]\tLoss: 2.310344\n", - "Train Epoch: 1 [1920/60000 (3%)]\tLoss: 2.292868\n", - "Train Epoch: 1 [2560/60000 
(4%)]\tLoss: 2.290216\n", - "Train Epoch: 1 [3200/60000 (5%)]\tLoss: 2.276424\n", - "Train Epoch: 1 [3840/60000 (6%)]\tLoss: 2.281419\n", - "Train Epoch: 1 [4480/60000 (7%)]\tLoss: 2.276124\n", - "Train Epoch: 1 [5120/60000 (9%)]\tLoss: 2.267236\n", - "Train Epoch: 1 [5760/60000 (10%)]\tLoss: 2.294219\n", - "Train Epoch: 1 [6400/60000 (11%)]\tLoss: 2.254271\n", - "Train Epoch: 1 [7040/60000 (12%)]\tLoss: 2.264095\n", - "Train Epoch: 1 [7680/60000 (13%)]\tLoss: 2.256358\n", - "Train Epoch: 1 [8320/60000 (14%)]\tLoss: 2.274228\n", - "Train Epoch: 1 [8960/60000 (15%)]\tLoss: 2.269273\n", - "Train Epoch: 1 [9600/60000 (16%)]\tLoss: 2.240185\n", - "Train Epoch: 1 [10240/60000 (17%)]\tLoss: 2.248815\n", - "Train Epoch: 1 [10880/60000 (18%)]\tLoss: 2.223281\n", - "Train Epoch: 1 [11520/60000 (19%)]\tLoss: 2.222255\n", - "Train Epoch: 1 [12160/60000 (20%)]\tLoss: 2.233015\n", - "Train Epoch: 1 [12800/60000 (21%)]\tLoss: 2.211506\n", - "Train Epoch: 1 [13440/60000 (22%)]\tLoss: 2.234103\n", - "Train Epoch: 1 [14080/60000 (23%)]\tLoss: 2.225921\n", - "Train Epoch: 1 [14720/60000 (25%)]\tLoss: 2.202645\n", - "Train Epoch: 1 [15360/60000 (26%)]\tLoss: 2.196408\n", - "Train Epoch: 1 [16000/60000 (27%)]\tLoss: 2.202403\n", - "Train Epoch: 1 [16640/60000 (28%)]\tLoss: 2.209469\n", - "Train Epoch: 1 [17280/60000 (29%)]\tLoss: 2.180980\n", - "Train Epoch: 1 [17920/60000 (30%)]\tLoss: 2.153812\n", - "Train Epoch: 1 [18560/60000 (31%)]\tLoss: 2.150105\n", - "Train Epoch: 1 [19200/60000 (32%)]\tLoss: 2.158034\n", - "Train Epoch: 1 [19840/60000 (33%)]\tLoss: 2.172502\n", - "Train Epoch: 1 [20480/60000 (34%)]\tLoss: 2.093013\n", - "Train Epoch: 1 [21120/60000 (35%)]\tLoss: 2.130392\n", - "Train Epoch: 1 [21760/60000 (36%)]\tLoss: 2.172241\n", - "Train Epoch: 1 [22400/60000 (37%)]\tLoss: 2.162427\n", - "Train Epoch: 1 [23040/60000 (38%)]\tLoss: 2.168904\n", - "Train Epoch: 1 [23680/60000 (39%)]\tLoss: 2.179659\n", - "Train Epoch: 1 [24320/60000 (41%)]\tLoss: 2.163229\n", - "Train Epoch: 
1 [24960/60000 (42%)]\tLoss: 2.126366\n", - "Train Epoch: 1 [25600/60000 (43%)]\tLoss: 2.138455\n", - "Train Epoch: 1 [26240/60000 (44%)]\tLoss: 2.113500\n", - "Train Epoch: 1 [26880/60000 (45%)]\tLoss: 2.067201\n", - "Train Epoch: 1 [27520/60000 (46%)]\tLoss: 2.114285\n", - "Train Epoch: 1 [28160/60000 (47%)]\tLoss: 2.036888\n", - "Train Epoch: 1 [28800/60000 (48%)]\tLoss: 2.068524\n", - "Train Epoch: 1 [29440/60000 (49%)]\tLoss: 2.097640\n", - "Train Epoch: 1 [30080/60000 (50%)]\tLoss: 2.028418\n", - "Train Epoch: 1 [30720/60000 (51%)]\tLoss: 2.031548\n", - "Train Epoch: 1 [31360/60000 (52%)]\tLoss: 2.051078\n", - "Train Epoch: 1 [32000/60000 (53%)]\tLoss: 2.028303\n", - "Train Epoch: 1 [32640/60000 (54%)]\tLoss: 1.983975\n", - "Train Epoch: 1 [33280/60000 (55%)]\tLoss: 2.043919\n", - "Train Epoch: 1 [33920/60000 (57%)]\tLoss: 1.980050\n", - "Train Epoch: 1 [34560/60000 (58%)]\tLoss: 1.970208\n", - "Train Epoch: 1 [35200/60000 (59%)]\tLoss: 2.048699\n", - "Train Epoch: 1 [35840/60000 (60%)]\tLoss: 1.956716\n", - "Train Epoch: 1 [36480/60000 (61%)]\tLoss: 1.987072\n", - "Train Epoch: 1 [37120/60000 (62%)]\tLoss: 1.984343\n", - "Train Epoch: 1 [37760/60000 (63%)]\tLoss: 1.947972\n", - "Train Epoch: 1 [38400/60000 (64%)]\tLoss: 1.938421\n", - "Train Epoch: 1 [39040/60000 (65%)]\tLoss: 1.919820\n", - "Train Epoch: 1 [39680/60000 (66%)]\tLoss: 1.931831\n", - "Train Epoch: 1 [40320/60000 (67%)]\tLoss: 1.953799\n", - "Train Epoch: 1 [40960/60000 (68%)]\tLoss: 1.883609\n", - "Train Epoch: 1 [41600/60000 (69%)]\tLoss: 1.876115\n", - "Train Epoch: 1 [42240/60000 (70%)]\tLoss: 1.870510\n", - "Train Epoch: 1 [42880/60000 (71%)]\tLoss: 1.910781\n", - "Train Epoch: 1 [43520/60000 (72%)]\tLoss: 1.950781\n", - "Train Epoch: 1 [44160/60000 (74%)]\tLoss: 1.985367\n", - "Train Epoch: 1 [44800/60000 (75%)]\tLoss: 1.823831\n", - "Train Epoch: 1 [45440/60000 (76%)]\tLoss: 1.870280\n", - "Train Epoch: 1 [46080/60000 (77%)]\tLoss: 1.794647\n", - "Train Epoch: 1 [46720/60000 
(78%)]\tLoss: 1.864569\n", - "Train Epoch: 1 [47360/60000 (79%)]\tLoss: 1.871643\n", - "Train Epoch: 1 [48000/60000 (80%)]\tLoss: 1.794408\n", - "Train Epoch: 1 [48640/60000 (81%)]\tLoss: 1.836012\n", - "Train Epoch: 1 [49280/60000 (82%)]\tLoss: 1.784632\n", - "Train Epoch: 1 [49920/60000 (83%)]\tLoss: 1.775053\n", - "Train Epoch: 1 [50560/60000 (84%)]\tLoss: 1.691660\n", - "Train Epoch: 1 [51200/60000 (85%)]\tLoss: 1.818502\n", - "Train Epoch: 1 [51840/60000 (86%)]\tLoss: 1.792987\n", - "Train Epoch: 1 [52480/60000 (87%)]\tLoss: 1.763221\n", - "Train Epoch: 1 [53120/60000 (88%)]\tLoss: 1.779346\n", - "Train Epoch: 1 [53760/60000 (90%)]\tLoss: 1.678108\n", - "Train Epoch: 1 [54400/60000 (91%)]\tLoss: 1.780516\n", - "Train Epoch: 1 [55040/60000 (92%)]\tLoss: 1.650490\n", - "Train Epoch: 1 [55680/60000 (93%)]\tLoss: 1.704799\n", - "Train Epoch: 1 [56320/60000 (94%)]\tLoss: 1.720001\n", - "Train Epoch: 1 [56960/60000 (95%)]\tLoss: 1.716193\n", - "Train Epoch: 1 [57600/60000 (96%)]\tLoss: 1.665386\n", - "Train Epoch: 1 [58240/60000 (97%)]\tLoss: 1.669093\n", - "Train Epoch: 1 [58880/60000 (98%)]\tLoss: 1.669740\n", - "Train Epoch: 1 [59520/60000 (99%)]\tLoss: 1.576309\n", - "\n", - "Test set: Average loss: 1.5640\n", - "Class 0 accuracy: 942.0/980(96%)\n", - "Class 1 accuracy: 1049.0/1135(92%)\n", - "Class 2 accuracy: 530.0/1032(51%)\n", - "Class 3 accuracy: 928.0/1010(92%)\n", - "Class 4 accuracy: 747.0/982(76%)\n", - "Class 5 accuracy: 299.0/892(34%)\n", - "Class 6 accuracy: 880.0/958(92%)\n", - "Class 7 accuracy: 851.0/1028(83%)\n", - "Class 8 accuracy: 744.0/974(76%)\n", - "Class 9 accuracy: 788.0/1009(78%)\n", - "Train Epoch: 2 [0/60000 (0%)]\tLoss: 1.627061\n", - "Train Epoch: 2 [640/60000 (1%)]\tLoss: 1.545597\n", - "Train Epoch: 2 [1280/60000 (2%)]\tLoss: 1.698457\n", - "Train Epoch: 2 [1920/60000 (3%)]\tLoss: 1.572205\n", - "Train Epoch: 2 [2560/60000 (4%)]\tLoss: 1.636262\n", - "Train Epoch: 2 [3200/60000 (5%)]\tLoss: 1.641547\n", - "Train Epoch: 2 
[3840/60000 (6%)]\tLoss: 1.528854\n", - "Train Epoch: 2 [4480/60000 (7%)]\tLoss: 1.606497\n", - "Train Epoch: 2 [5120/60000 (9%)]\tLoss: 1.548691\n", - "Train Epoch: 2 [5760/60000 (10%)]\tLoss: 1.562155\n", - "Train Epoch: 2 [6400/60000 (11%)]\tLoss: 1.498272\n", - "Train Epoch: 2 [7040/60000 (12%)]\tLoss: 1.519710\n", - "Train Epoch: 2 [7680/60000 (13%)]\tLoss: 1.605046\n", - "Train Epoch: 2 [8320/60000 (14%)]\tLoss: 1.567077\n", - "Train Epoch: 2 [8960/60000 (15%)]\tLoss: 1.434826\n", - "Train Epoch: 2 [9600/60000 (16%)]\tLoss: 1.478333\n", - "Train Epoch: 2 [10240/60000 (17%)]\tLoss: 1.479111\n", - "Train Epoch: 2 [10880/60000 (18%)]\tLoss: 1.503707\n", - "Train Epoch: 2 [11520/60000 (19%)]\tLoss: 1.373165\n", - "Train Epoch: 2 [12160/60000 (20%)]\tLoss: 1.460236\n", - "Train Epoch: 2 [12800/60000 (21%)]\tLoss: 1.565628\n", - "Train Epoch: 2 [13440/60000 (22%)]\tLoss: 1.565041\n", - "Train Epoch: 2 [14080/60000 (23%)]\tLoss: 1.426577\n", - "Train Epoch: 2 [14720/60000 (25%)]\tLoss: 1.531582\n", - "Train Epoch: 2 [15360/60000 (26%)]\tLoss: 1.427804\n", - "Train Epoch: 2 [16000/60000 (27%)]\tLoss: 1.453471\n", - "Train Epoch: 2 [16640/60000 (28%)]\tLoss: 1.528445\n", - "Train Epoch: 2 [17280/60000 (29%)]\tLoss: 1.515689\n", - "Train Epoch: 2 [17920/60000 (30%)]\tLoss: 1.517196\n", - "Train Epoch: 2 [18560/60000 (31%)]\tLoss: 1.446620\n", - "Train Epoch: 2 [19200/60000 (32%)]\tLoss: 1.496210\n", - "Train Epoch: 2 [19840/60000 (33%)]\tLoss: 1.423505\n", - "Train Epoch: 2 [20480/60000 (34%)]\tLoss: 1.415124\n", - "Train Epoch: 2 [21120/60000 (35%)]\tLoss: 1.544892\n", - "Train Epoch: 2 [21760/60000 (36%)]\tLoss: 1.340283\n", - "Train Epoch: 2 [22400/60000 (37%)]\tLoss: 1.363816\n", - "Train Epoch: 2 [23040/60000 (38%)]\tLoss: 1.382646\n", - "Train Epoch: 2 [23680/60000 (39%)]\tLoss: 1.264206\n", - "Train Epoch: 2 [24320/60000 (41%)]\tLoss: 1.332618\n", - "Train Epoch: 2 [24960/60000 (42%)]\tLoss: 1.358470\n", - "Train Epoch: 2 [25600/60000 (43%)]\tLoss: 1.344868\n", 
- "Train Epoch: 2 [26240/60000 (44%)]\tLoss: 1.327641\n", - "Train Epoch: 2 [26880/60000 (45%)]\tLoss: 1.382141\n", - "Train Epoch: 2 [27520/60000 (46%)]\tLoss: 1.403416\n", - "Train Epoch: 2 [28160/60000 (47%)]\tLoss: 1.420001\n", - "Train Epoch: 2 [28800/60000 (48%)]\tLoss: 1.414284\n", - "Train Epoch: 2 [29440/60000 (49%)]\tLoss: 1.367697\n", - "Train Epoch: 2 [30080/60000 (50%)]\tLoss: 1.498880\n", - "Train Epoch: 2 [30720/60000 (51%)]\tLoss: 1.278797\n", - "Train Epoch: 2 [31360/60000 (52%)]\tLoss: 1.333852\n", - "Train Epoch: 2 [32000/60000 (53%)]\tLoss: 1.370776\n", - "Train Epoch: 2 [32640/60000 (54%)]\tLoss: 1.062860\n", - "Train Epoch: 2 [33280/60000 (55%)]\tLoss: 1.245440\n", - "Train Epoch: 2 [33920/60000 (57%)]\tLoss: 1.152776\n", - "Train Epoch: 2 [34560/60000 (58%)]\tLoss: 1.344226\n", - "Train Epoch: 2 [35200/60000 (59%)]\tLoss: 1.242468\n", - "Train Epoch: 2 [35840/60000 (60%)]\tLoss: 1.353402\n", - "Train Epoch: 2 [36480/60000 (61%)]\tLoss: 1.166169\n", - "Train Epoch: 2 [37120/60000 (62%)]\tLoss: 1.165925\n", - "Train Epoch: 2 [37760/60000 (63%)]\tLoss: 1.237298\n", - "Train Epoch: 2 [38400/60000 (64%)]\tLoss: 1.209161\n", - "Train Epoch: 2 [39040/60000 (65%)]\tLoss: 1.284919\n", - "Train Epoch: 2 [39680/60000 (66%)]\tLoss: 1.301399\n", - "Train Epoch: 2 [40320/60000 (67%)]\tLoss: 1.257363\n", - "Train Epoch: 2 [40960/60000 (68%)]\tLoss: 1.199494\n", - "Train Epoch: 2 [41600/60000 (69%)]\tLoss: 1.113902\n", - "Train Epoch: 2 [42240/60000 (70%)]\tLoss: 1.155495\n", - "Train Epoch: 2 [42880/60000 (71%)]\tLoss: 1.227993\n", - "Train Epoch: 2 [43520/60000 (72%)]\tLoss: 1.231888\n", - "Train Epoch: 2 [44160/60000 (74%)]\tLoss: 1.373095\n", - "Train Epoch: 2 [44800/60000 (75%)]\tLoss: 1.248195\n", - "Train Epoch: 2 [45440/60000 (76%)]\tLoss: 1.127467\n", - "Train Epoch: 2 [46080/60000 (77%)]\tLoss: 1.045080\n", - "Train Epoch: 2 [46720/60000 (78%)]\tLoss: 1.206602\n", - "Train Epoch: 2 [47360/60000 (79%)]\tLoss: 1.128123\n", - "Train Epoch: 2 
[48000/60000 (80%)]\tLoss: 1.348677\n", - "Train Epoch: 2 [48640/60000 (81%)]\tLoss: 1.197632\n", - "Train Epoch: 2 [49280/60000 (82%)]\tLoss: 1.165728\n", - "Train Epoch: 2 [49920/60000 (83%)]\tLoss: 1.209910\n", - "Train Epoch: 2 [50560/60000 (84%)]\tLoss: 1.137662\n", - "Train Epoch: 2 [51200/60000 (85%)]\tLoss: 1.109170\n", - "Train Epoch: 2 [51840/60000 (86%)]\tLoss: 1.038135\n", - "Train Epoch: 2 [52480/60000 (87%)]\tLoss: 1.092770\n", - "Train Epoch: 2 [53120/60000 (88%)]\tLoss: 1.205910\n", - "Train Epoch: 2 [53760/60000 (90%)]\tLoss: 0.988055\n", - "Train Epoch: 2 [54400/60000 (91%)]\tLoss: 1.205869\n", - "Train Epoch: 2 [55040/60000 (92%)]\tLoss: 1.149507\n", - "Train Epoch: 2 [55680/60000 (93%)]\tLoss: 1.059419\n", - "Train Epoch: 2 [56320/60000 (94%)]\tLoss: 1.130637\n", - "Train Epoch: 2 [56960/60000 (95%)]\tLoss: 1.067291\n", - "Train Epoch: 2 [57600/60000 (96%)]\tLoss: 1.102901\n", - "Train Epoch: 2 [58240/60000 (97%)]\tLoss: 1.082644\n", - "Train Epoch: 2 [58880/60000 (98%)]\tLoss: 1.176209\n", - "Train Epoch: 2 [59520/60000 (99%)]\tLoss: 1.100892\n", - "\n", - "Test set: Average loss: 0.9323\n", - "Class 0 accuracy: 937.0/980(96%)\n", - "Class 1 accuracy: 1083.0/1135(95%)\n", - "Class 2 accuracy: 748.0/1032(72%)\n", - "Class 3 accuracy: 923.0/1010(91%)\n", - "Class 4 accuracy: 826.0/982(84%)\n", - "Class 5 accuracy: 470.0/892(53%)\n", - "Class 6 accuracy: 886.0/958(92%)\n", - "Class 7 accuracy: 898.0/1028(87%)\n", - "Class 8 accuracy: 732.0/974(75%)\n", - "Class 9 accuracy: 844.0/1009(84%)\n", - "Train Epoch: 3 [0/60000 (0%)]\tLoss: 1.117987\n", - "Train Epoch: 3 [640/60000 (1%)]\tLoss: 1.044462\n", - "Train Epoch: 3 [1280/60000 (2%)]\tLoss: 1.027436\n", - "Train Epoch: 3 [1920/60000 (3%)]\tLoss: 1.230957\n", - "Train Epoch: 3 [2560/60000 (4%)]\tLoss: 1.004591\n", - "Train Epoch: 3 [3200/60000 (5%)]\tLoss: 1.060180\n", - "Train Epoch: 3 [3840/60000 (6%)]\tLoss: 0.902412\n", - "Train Epoch: 3 [4480/60000 (7%)]\tLoss: 0.957223\n", - "Train Epoch: 3 
[5120/60000 (9%)]\tLoss: 1.091123\n", - "Train Epoch: 3 [5760/60000 (10%)]\tLoss: 1.175083\n", - "Train Epoch: 3 [6400/60000 (11%)]\tLoss: 0.969085\n", - "Train Epoch: 3 [7040/60000 (12%)]\tLoss: 1.044883\n", - "Train Epoch: 3 [7680/60000 (13%)]\tLoss: 1.010503\n", - "Train Epoch: 3 [8320/60000 (14%)]\tLoss: 1.037116\n", - "Train Epoch: 3 [8960/60000 (15%)]\tLoss: 0.968517\n", - "Train Epoch: 3 [9600/60000 (16%)]\tLoss: 1.037061\n", - "Train Epoch: 3 [10240/60000 (17%)]\tLoss: 0.992225\n", - "Train Epoch: 3 [10880/60000 (18%)]\tLoss: 1.091760\n", - "Train Epoch: 3 [11520/60000 (19%)]\tLoss: 1.100666\n", - "Train Epoch: 3 [12160/60000 (20%)]\tLoss: 0.852405\n", - "Train Epoch: 3 [12800/60000 (21%)]\tLoss: 0.957409\n", - "Train Epoch: 3 [13440/60000 (22%)]\tLoss: 0.959758\n", - "Train Epoch: 3 [14080/60000 (23%)]\tLoss: 0.998838\n", - "Train Epoch: 3 [14720/60000 (25%)]\tLoss: 1.045380\n", - "Train Epoch: 3 [15360/60000 (26%)]\tLoss: 0.842424\n", - "Train Epoch: 3 [16000/60000 (27%)]\tLoss: 1.003876\n", - "Train Epoch: 3 [16640/60000 (28%)]\tLoss: 0.948943\n", - "Train Epoch: 3 [17280/60000 (29%)]\tLoss: 1.090439\n", - "Train Epoch: 3 [17920/60000 (30%)]\tLoss: 1.087915\n", - "Train Epoch: 3 [18560/60000 (31%)]\tLoss: 1.145274\n", - "Train Epoch: 3 [19200/60000 (32%)]\tLoss: 1.217145\n", - "Train Epoch: 3 [19840/60000 (33%)]\tLoss: 1.085176\n", - "Train Epoch: 3 [20480/60000 (34%)]\tLoss: 1.083079\n", - "Train Epoch: 3 [21120/60000 (35%)]\tLoss: 0.999794\n", - "Train Epoch: 3 [21760/60000 (36%)]\tLoss: 0.911105\n", - "Train Epoch: 3 [22400/60000 (37%)]\tLoss: 1.273139\n", - "Train Epoch: 3 [23040/60000 (38%)]\tLoss: 1.048052\n", - "Train Epoch: 3 [23680/60000 (39%)]\tLoss: 0.818689\n", - "Train Epoch: 3 [24320/60000 (41%)]\tLoss: 0.858526\n", - "Train Epoch: 3 [24960/60000 (42%)]\tLoss: 0.982630\n", - "Train Epoch: 3 [25600/60000 (43%)]\tLoss: 1.042941\n", - "Train Epoch: 3 [26240/60000 (44%)]\tLoss: 0.818404\n", - "Train Epoch: 3 [26880/60000 (45%)]\tLoss: 
0.947276\n", - "Train Epoch: 3 [27520/60000 (46%)]\tLoss: 0.990826\n", - "Train Epoch: 3 [28160/60000 (47%)]\tLoss: 0.956242\n", - "Train Epoch: 3 [28800/60000 (48%)]\tLoss: 1.052988\n", - "Train Epoch: 3 [29440/60000 (49%)]\tLoss: 1.157221\n", - "Train Epoch: 3 [30080/60000 (50%)]\tLoss: 0.913521\n", - "Train Epoch: 3 [30720/60000 (51%)]\tLoss: 1.009682\n", - "Train Epoch: 3 [31360/60000 (52%)]\tLoss: 0.770679\n", - "Train Epoch: 3 [32000/60000 (53%)]\tLoss: 0.990214\n", - "Train Epoch: 3 [32640/60000 (54%)]\tLoss: 0.937079\n", - "Train Epoch: 3 [33280/60000 (55%)]\tLoss: 0.872119\n", - "Train Epoch: 3 [33920/60000 (57%)]\tLoss: 0.840864\n", - "Train Epoch: 3 [34560/60000 (58%)]\tLoss: 1.002336\n", - "Train Epoch: 3 [35200/60000 (59%)]\tLoss: 0.915164\n", - "Train Epoch: 3 [35840/60000 (60%)]\tLoss: 1.012089\n", - "Train Epoch: 3 [36480/60000 (61%)]\tLoss: 0.939280\n", - "Train Epoch: 3 [37120/60000 (62%)]\tLoss: 1.060541\n", - "Train Epoch: 3 [37760/60000 (63%)]\tLoss: 0.937920\n", - "Train Epoch: 3 [38400/60000 (64%)]\tLoss: 1.006945\n", - "Train Epoch: 3 [39040/60000 (65%)]\tLoss: 1.078756\n", - "Train Epoch: 3 [39680/60000 (66%)]\tLoss: 1.017594\n", - "Train Epoch: 3 [40320/60000 (67%)]\tLoss: 1.033234\n", - "Train Epoch: 3 [40960/60000 (68%)]\tLoss: 1.230211\n", - "Train Epoch: 3 [41600/60000 (69%)]\tLoss: 0.684275\n", - "Train Epoch: 3 [42240/60000 (70%)]\tLoss: 1.083214\n", - "Train Epoch: 3 [42880/60000 (71%)]\tLoss: 0.852170\n", - "Train Epoch: 3 [43520/60000 (72%)]\tLoss: 0.995445\n", - "Train Epoch: 3 [44160/60000 (74%)]\tLoss: 0.790355\n", - "Train Epoch: 3 [44800/60000 (75%)]\tLoss: 0.920374\n", - "Train Epoch: 3 [45440/60000 (76%)]\tLoss: 1.090557\n", - "Train Epoch: 3 [46080/60000 (77%)]\tLoss: 0.755298\n", - "Train Epoch: 3 [46720/60000 (78%)]\tLoss: 1.101079\n", - "Train Epoch: 3 [47360/60000 (79%)]\tLoss: 0.719922\n", - "Train Epoch: 3 [48000/60000 (80%)]\tLoss: 0.805579\n", - "Train Epoch: 3 [48640/60000 (81%)]\tLoss: 0.866616\n", - "Train 
Epoch: 3 [49280/60000 (82%)]\tLoss: 0.777545\n", - "Train Epoch: 3 [49920/60000 (83%)]\tLoss: 0.800337\n", - "Train Epoch: 3 [50560/60000 (84%)]\tLoss: 0.921025\n", - "Train Epoch: 3 [51200/60000 (85%)]\tLoss: 0.961804\n", - "Train Epoch: 3 [51840/60000 (86%)]\tLoss: 0.882696\n", - "Train Epoch: 3 [52480/60000 (87%)]\tLoss: 0.849839\n", - "Train Epoch: 3 [53120/60000 (88%)]\tLoss: 0.893887\n", - "Train Epoch: 3 [53760/60000 (90%)]\tLoss: 0.815971\n", - "Train Epoch: 3 [54400/60000 (91%)]\tLoss: 1.109305\n", - "Train Epoch: 3 [55040/60000 (92%)]\tLoss: 0.864345\n", - "Train Epoch: 3 [55680/60000 (93%)]\tLoss: 0.969730\n", - "Train Epoch: 3 [56320/60000 (94%)]\tLoss: 0.959234\n", - "Train Epoch: 3 [56960/60000 (95%)]\tLoss: 0.954617\n", - "Train Epoch: 3 [57600/60000 (96%)]\tLoss: 0.790892\n", - "Train Epoch: 3 [58240/60000 (97%)]\tLoss: 1.002821\n", - "Train Epoch: 3 [58880/60000 (98%)]\tLoss: 0.799075\n", - "Train Epoch: 3 [59520/60000 (99%)]\tLoss: 0.859415\n", - "\n", - "Test set: Average loss: 0.7067\n", - "Class 0 accuracy: 942.0/980(96%)\n", - "Class 1 accuracy: 1085.0/1135(96%)\n", - "Class 2 accuracy: 815.0/1032(79%)\n", - "Class 3 accuracy: 909.0/1010(90%)\n", - "Class 4 accuracy: 844.0/982(86%)\n", - "Class 5 accuracy: 572.0/892(64%)\n", - "Class 6 accuracy: 881.0/958(92%)\n", - "Class 7 accuracy: 895.0/1028(87%)\n", - "Class 8 accuracy: 773.0/974(79%)\n", - "Class 9 accuracy: 861.0/1009(85%)\n", - "Train Epoch: 4 [0/60000 (0%)]\tLoss: 0.921860\n", - "Train Epoch: 4 [640/60000 (1%)]\tLoss: 1.006901\n", - "Train Epoch: 4 [1280/60000 (2%)]\tLoss: 0.829744\n", - "Train Epoch: 4 [1920/60000 (3%)]\tLoss: 0.958730\n", - "Train Epoch: 4 [2560/60000 (4%)]\tLoss: 0.908768\n", - "Train Epoch: 4 [3200/60000 (5%)]\tLoss: 0.809689\n", - "Train Epoch: 4 [3840/60000 (6%)]\tLoss: 0.864438\n", - "Train Epoch: 4 [4480/60000 (7%)]\tLoss: 0.871907\n", - "Train Epoch: 4 [5120/60000 (9%)]\tLoss: 0.879927\n", - "Train Epoch: 4 [5760/60000 (10%)]\tLoss: 0.958960\n", - "Train 
Epoch: 4 [6400/60000 (11%)]\tLoss: 0.866098\n", - "Train Epoch: 4 [7040/60000 (12%)]\tLoss: 1.041393\n", - "Train Epoch: 4 [7680/60000 (13%)]\tLoss: 0.813019\n", - "Train Epoch: 4 [8320/60000 (14%)]\tLoss: 0.767784\n", - "Train Epoch: 4 [8960/60000 (15%)]\tLoss: 0.933339\n", - "Train Epoch: 4 [9600/60000 (16%)]\tLoss: 0.821877\n", - "Train Epoch: 4 [10240/60000 (17%)]\tLoss: 0.826119\n", - "Train Epoch: 4 [10880/60000 (18%)]\tLoss: 0.772280\n", - "Train Epoch: 4 [11520/60000 (19%)]\tLoss: 0.868618\n", - "Train Epoch: 4 [12160/60000 (20%)]\tLoss: 1.034466\n", - "Train Epoch: 4 [12800/60000 (21%)]\tLoss: 0.872086\n", - "Train Epoch: 4 [13440/60000 (22%)]\tLoss: 0.912373\n", - "Train Epoch: 4 [14080/60000 (23%)]\tLoss: 0.870299\n", - "Train Epoch: 4 [14720/60000 (25%)]\tLoss: 0.731594\n", - "Train Epoch: 4 [15360/60000 (26%)]\tLoss: 1.079396\n", - "Train Epoch: 4 [16000/60000 (27%)]\tLoss: 0.882126\n", - "Train Epoch: 4 [16640/60000 (28%)]\tLoss: 0.682331\n", - "Train Epoch: 4 [17280/60000 (29%)]\tLoss: 1.029123\n", - "Train Epoch: 4 [17920/60000 (30%)]\tLoss: 0.596465\n", - "Train Epoch: 4 [18560/60000 (31%)]\tLoss: 0.813218\n", - "Train Epoch: 4 [19200/60000 (32%)]\tLoss: 0.747696\n", - "Train Epoch: 4 [19840/60000 (33%)]\tLoss: 0.880849\n", - "Train Epoch: 4 [20480/60000 (34%)]\tLoss: 0.734443\n", - "Train Epoch: 4 [21120/60000 (35%)]\tLoss: 0.840509\n", - "Train Epoch: 4 [21760/60000 (36%)]\tLoss: 0.745489\n", - "Train Epoch: 4 [22400/60000 (37%)]\tLoss: 0.841733\n", - "Train Epoch: 4 [23040/60000 (38%)]\tLoss: 0.920951\n", - "Train Epoch: 4 [23680/60000 (39%)]\tLoss: 0.924071\n", - "Train Epoch: 4 [24320/60000 (41%)]\tLoss: 0.906279\n", - "Train Epoch: 4 [24960/60000 (42%)]\tLoss: 0.867031\n", - "Train Epoch: 4 [25600/60000 (43%)]\tLoss: 0.946203\n", - "Train Epoch: 4 [26240/60000 (44%)]\tLoss: 0.989663\n", - "Train Epoch: 4 [26880/60000 (45%)]\tLoss: 0.839466\n", - "Train Epoch: 4 [27520/60000 (46%)]\tLoss: 0.843587\n", - "Train Epoch: 4 [28160/60000 
(47%)]\tLoss: 0.737129\n", - "Train Epoch: 4 [28800/60000 (48%)]\tLoss: 0.807360\n", - "Train Epoch: 4 [29440/60000 (49%)]\tLoss: 0.823521\n", - "Train Epoch: 4 [30080/60000 (50%)]\tLoss: 0.841337\n", - "Train Epoch: 4 [30720/60000 (51%)]\tLoss: 0.999043\n", - "Train Epoch: 4 [31360/60000 (52%)]\tLoss: 0.962988\n", - "Train Epoch: 4 [32000/60000 (53%)]\tLoss: 1.040999\n", - "Train Epoch: 4 [32640/60000 (54%)]\tLoss: 0.750595\n", - "Train Epoch: 4 [33280/60000 (55%)]\tLoss: 0.904500\n", - "Train Epoch: 4 [33920/60000 (57%)]\tLoss: 0.716458\n", - "Train Epoch: 4 [34560/60000 (58%)]\tLoss: 0.917832\n", - "Train Epoch: 4 [35200/60000 (59%)]\tLoss: 0.834955\n", - "Train Epoch: 4 [35840/60000 (60%)]\tLoss: 0.833779\n", - "Train Epoch: 4 [36480/60000 (61%)]\tLoss: 0.798480\n", - "Train Epoch: 4 [37120/60000 (62%)]\tLoss: 0.718178\n", - "Train Epoch: 4 [37760/60000 (63%)]\tLoss: 0.774633\n", - "Train Epoch: 4 [38400/60000 (64%)]\tLoss: 0.640932\n", - "Train Epoch: 4 [39040/60000 (65%)]\tLoss: 0.761126\n", - "Train Epoch: 4 [39680/60000 (66%)]\tLoss: 0.567800\n", - "Train Epoch: 4 [40320/60000 (67%)]\tLoss: 0.731927\n", - "Train Epoch: 4 [40960/60000 (68%)]\tLoss: 0.972790\n", - "Train Epoch: 4 [41600/60000 (69%)]\tLoss: 0.913961\n", - "Train Epoch: 4 [42240/60000 (70%)]\tLoss: 0.630956\n", - "Train Epoch: 4 [42880/60000 (71%)]\tLoss: 0.928092\n", - "Train Epoch: 4 [43520/60000 (72%)]\tLoss: 0.749575\n", - "Train Epoch: 4 [44160/60000 (74%)]\tLoss: 0.970667\n", - "Train Epoch: 4 [44800/60000 (75%)]\tLoss: 0.804512\n", - "Train Epoch: 4 [45440/60000 (76%)]\tLoss: 0.832241\n", - "Train Epoch: 4 [46080/60000 (77%)]\tLoss: 0.851197\n", - "Train Epoch: 4 [46720/60000 (78%)]\tLoss: 0.918072\n", - "Train Epoch: 4 [47360/60000 (79%)]\tLoss: 0.886158\n", - "Train Epoch: 4 [48000/60000 (80%)]\tLoss: 0.803933\n", - "Train Epoch: 4 [48640/60000 (81%)]\tLoss: 0.711099\n", - "Train Epoch: 4 [49280/60000 (82%)]\tLoss: 0.786826\n", - "Train Epoch: 4 [49920/60000 (83%)]\tLoss: 0.834988\n", 
- "Train Epoch: 4 [50560/60000 (84%)]\tLoss: 0.902848\n", - "Train Epoch: 4 [51200/60000 (85%)]\tLoss: 0.838035\n", - "Train Epoch: 4 [51840/60000 (86%)]\tLoss: 0.853425\n", - "Train Epoch: 4 [52480/60000 (87%)]\tLoss: 0.843906\n", - "Train Epoch: 4 [53120/60000 (88%)]\tLoss: 0.782411\n", - "Train Epoch: 4 [53760/60000 (90%)]\tLoss: 0.752052\n", - "Train Epoch: 4 [54400/60000 (91%)]\tLoss: 0.738311\n", - "Train Epoch: 4 [55040/60000 (92%)]\tLoss: 0.929952\n", - "Train Epoch: 4 [55680/60000 (93%)]\tLoss: 0.858274\n", - "Train Epoch: 4 [56320/60000 (94%)]\tLoss: 1.006905\n", - "Train Epoch: 4 [56960/60000 (95%)]\tLoss: 0.824607\n", - "Train Epoch: 4 [57600/60000 (96%)]\tLoss: 0.852737\n", - "Train Epoch: 4 [58240/60000 (97%)]\tLoss: 0.789701\n", - "Train Epoch: 4 [58880/60000 (98%)]\tLoss: 0.821994\n", - "Train Epoch: 4 [59520/60000 (99%)]\tLoss: 0.840377\n", - "\n", - "Test set: Average loss: 0.6137\n", - "Class 0 accuracy: 947.0/980(97%)\n", - "Class 1 accuracy: 1097.0/1135(97%)\n", - "Class 2 accuracy: 840.0/1032(81%)\n", - "Class 3 accuracy: 912.0/1010(90%)\n", - "Class 4 accuracy: 852.0/982(87%)\n", - "Class 5 accuracy: 602.0/892(67%)\n", - "Class 6 accuracy: 879.0/958(92%)\n", - "Class 7 accuracy: 904.0/1028(88%)\n", - "Class 8 accuracy: 770.0/974(79%)\n", - "Class 9 accuracy: 866.0/1009(86%)\n", - "Train Epoch: 5 [0/60000 (0%)]\tLoss: 0.841241\n", - "Train Epoch: 5 [640/60000 (1%)]\tLoss: 0.963371\n", - "Train Epoch: 5 [1280/60000 (2%)]\tLoss: 0.714024\n", - "Train Epoch: 5 [1920/60000 (3%)]\tLoss: 0.760713\n", - "Train Epoch: 5 [2560/60000 (4%)]\tLoss: 0.709700\n", - "Train Epoch: 5 [3200/60000 (5%)]\tLoss: 0.959411\n", - "Train Epoch: 5 [3840/60000 (6%)]\tLoss: 0.823688\n", - "Train Epoch: 5 [4480/60000 (7%)]\tLoss: 0.688386\n", - "Train Epoch: 5 [5120/60000 (9%)]\tLoss: 0.836027\n", - "Train Epoch: 5 [5760/60000 (10%)]\tLoss: 0.814876\n", - "Train Epoch: 5 [6400/60000 (11%)]\tLoss: 0.915517\n", - "Train Epoch: 5 [7040/60000 (12%)]\tLoss: 0.930052\n", - 
"Train Epoch: 5 [7680/60000 (13%)]\tLoss: 0.713963\n", - "Train Epoch: 5 [8320/60000 (14%)]\tLoss: 0.611171\n", - "Train Epoch: 5 [8960/60000 (15%)]\tLoss: 0.753952\n", - "Train Epoch: 5 [9600/60000 (16%)]\tLoss: 0.753516\n", - "Train Epoch: 5 [10240/60000 (17%)]\tLoss: 0.638662\n", - "Train Epoch: 5 [10880/60000 (18%)]\tLoss: 0.851477\n", - "Train Epoch: 5 [11520/60000 (19%)]\tLoss: 0.748764\n", - "Train Epoch: 5 [12160/60000 (20%)]\tLoss: 0.717946\n", - "Train Epoch: 5 [12800/60000 (21%)]\tLoss: 0.648801\n", - "Train Epoch: 5 [13440/60000 (22%)]\tLoss: 0.817798\n", - "Train Epoch: 5 [14080/60000 (23%)]\tLoss: 1.011557\n", - "Train Epoch: 5 [14720/60000 (25%)]\tLoss: 0.979450\n", - "Train Epoch: 5 [15360/60000 (26%)]\tLoss: 0.741829\n", - "Train Epoch: 5 [16000/60000 (27%)]\tLoss: 0.929305\n", - "Train Epoch: 5 [16640/60000 (28%)]\tLoss: 0.898180\n", - "Train Epoch: 5 [17280/60000 (29%)]\tLoss: 0.682718\n", - "Train Epoch: 5 [17920/60000 (30%)]\tLoss: 0.841480\n", - "Train Epoch: 5 [18560/60000 (31%)]\tLoss: 0.895796\n", - "Train Epoch: 5 [19200/60000 (32%)]\tLoss: 0.707863\n", - "Train Epoch: 5 [19840/60000 (33%)]\tLoss: 0.851275\n", - "Train Epoch: 5 [20480/60000 (34%)]\tLoss: 0.855291\n", - "Train Epoch: 5 [21120/60000 (35%)]\tLoss: 0.851695\n", - "Train Epoch: 5 [21760/60000 (36%)]\tLoss: 0.684048\n", - "Train Epoch: 5 [22400/60000 (37%)]\tLoss: 0.917995\n", - "Train Epoch: 5 [23040/60000 (38%)]\tLoss: 0.765770\n", - "Train Epoch: 5 [23680/60000 (39%)]\tLoss: 0.647655\n", - "Train Epoch: 5 [24320/60000 (41%)]\tLoss: 0.739678\n", - "Train Epoch: 5 [24960/60000 (42%)]\tLoss: 0.672344\n", - "Train Epoch: 5 [25600/60000 (43%)]\tLoss: 0.766927\n", - "Train Epoch: 5 [26240/60000 (44%)]\tLoss: 0.738036\n", - "Train Epoch: 5 [26880/60000 (45%)]\tLoss: 0.852725\n", - "Train Epoch: 5 [27520/60000 (46%)]\tLoss: 0.632756\n", - "Train Epoch: 5 [28160/60000 (47%)]\tLoss: 0.689774\n", - "Train Epoch: 5 [28800/60000 (48%)]\tLoss: 0.674076\n", - "Train Epoch: 5 [29440/60000 
(49%)]\tLoss: 0.755838\n", - "Train Epoch: 5 [30080/60000 (50%)]\tLoss: 0.786167\n", - "Train Epoch: 5 [30720/60000 (51%)]\tLoss: 0.804736\n", - "Train Epoch: 5 [31360/60000 (52%)]\tLoss: 0.723398\n", - "Train Epoch: 5 [32000/60000 (53%)]\tLoss: 0.685933\n", - "Train Epoch: 5 [32640/60000 (54%)]\tLoss: 0.808149\n", - "Train Epoch: 5 [33280/60000 (55%)]\tLoss: 0.944384\n", - "Train Epoch: 5 [33920/60000 (57%)]\tLoss: 0.638669\n", - "Train Epoch: 5 [34560/60000 (58%)]\tLoss: 0.683750\n", - "Train Epoch: 5 [35200/60000 (59%)]\tLoss: 0.702595\n", - "Train Epoch: 5 [35840/60000 (60%)]\tLoss: 0.742202\n", - "Train Epoch: 5 [36480/60000 (61%)]\tLoss: 0.761243\n", - "Train Epoch: 5 [37120/60000 (62%)]\tLoss: 0.768657\n", - "Train Epoch: 5 [37760/60000 (63%)]\tLoss: 0.824368\n", - "Train Epoch: 5 [38400/60000 (64%)]\tLoss: 0.657427\n", - "Train Epoch: 5 [39040/60000 (65%)]\tLoss: 0.724466\n", - "Train Epoch: 5 [39680/60000 (66%)]\tLoss: 0.800387\n", - "Train Epoch: 5 [40320/60000 (67%)]\tLoss: 0.812061\n", - "Train Epoch: 5 [40960/60000 (68%)]\tLoss: 0.811920\n", - "Train Epoch: 5 [41600/60000 (69%)]\tLoss: 0.888286\n", - "Train Epoch: 5 [42240/60000 (70%)]\tLoss: 0.691121\n", - "Train Epoch: 5 [42880/60000 (71%)]\tLoss: 0.749742\n", - "Train Epoch: 5 [43520/60000 (72%)]\tLoss: 0.944218\n", - "Train Epoch: 5 [44160/60000 (74%)]\tLoss: 0.698245\n", - "Train Epoch: 5 [44800/60000 (75%)]\tLoss: 0.796792\n", - "Train Epoch: 5 [45440/60000 (76%)]\tLoss: 0.653151\n", - "Train Epoch: 5 [46080/60000 (77%)]\tLoss: 0.813349\n", - "Train Epoch: 5 [46720/60000 (78%)]\tLoss: 0.600790\n", - "Train Epoch: 5 [47360/60000 (79%)]\tLoss: 0.848091\n", - "Train Epoch: 5 [48000/60000 (80%)]\tLoss: 0.636887\n", - "Train Epoch: 5 [48640/60000 (81%)]\tLoss: 0.767468\n", - "Train Epoch: 5 [49280/60000 (82%)]\tLoss: 0.713464\n", - "Train Epoch: 5 [49920/60000 (83%)]\tLoss: 0.635464\n", - "Train Epoch: 5 [50560/60000 (84%)]\tLoss: 0.722847\n", - "Train Epoch: 5 [51200/60000 (85%)]\tLoss: 0.924447\n", 
- "Train Epoch: 5 [51840/60000 (86%)]\tLoss: 0.738732\n", - "Train Epoch: 5 [52480/60000 (87%)]\tLoss: 0.732151\n", - "Train Epoch: 5 [53120/60000 (88%)]\tLoss: 0.769458\n", - "Train Epoch: 5 [53760/60000 (90%)]\tLoss: 0.761817\n", - "Train Epoch: 5 [54400/60000 (91%)]\tLoss: 0.766024\n", - "Train Epoch: 5 [55040/60000 (92%)]\tLoss: 0.820377\n", - "Train Epoch: 5 [55680/60000 (93%)]\tLoss: 0.713448\n", - "Train Epoch: 5 [56320/60000 (94%)]\tLoss: 0.753411\n", - "Train Epoch: 5 [56960/60000 (95%)]\tLoss: 0.758932\n", - "Train Epoch: 5 [57600/60000 (96%)]\tLoss: 0.690840\n", - "Train Epoch: 5 [58240/60000 (97%)]\tLoss: 0.855213\n", - "Train Epoch: 5 [58880/60000 (98%)]\tLoss: 0.847026\n", - "Train Epoch: 5 [59520/60000 (99%)]\tLoss: 0.714162\n", - "\n", - "Test set: Average loss: 0.5663\n", - "Class 0 accuracy: 949.0/980(97%)\n", - "Class 1 accuracy: 1095.0/1135(96%)\n", - "Class 2 accuracy: 841.0/1032(81%)\n", - "Class 3 accuracy: 909.0/1010(90%)\n", - "Class 4 accuracy: 861.0/982(88%)\n", - "Class 5 accuracy: 630.0/892(71%)\n", - "Class 6 accuracy: 881.0/958(92%)\n", - "Class 7 accuracy: 906.0/1028(88%)\n", - "Class 8 accuracy: 798.0/974(82%)\n", - "Class 9 accuracy: 869.0/1009(86%)\n" - ] - }, - { - "output_type": "execute_result", - "data": { - "text/plain": [ - "[{0: 0.9612244897959183,\n", - " 1: 0.9242290748898678,\n", - " 2: 0.5135658914728682,\n", - " 3: 0.9188118811881189,\n", - " 4: 0.7606924643584522,\n", - " 5: 0.3352017937219731,\n", - " 6: 0.918580375782881,\n", - " 7: 0.8278210116731517,\n", - " 8: 0.7638603696098563,\n", - " 9: 0.7809712586719524,\n", - " 'phase': 'baseline'},\n", - " {0: 0.9561224489795919,\n", - " 1: 0.9541850220264317,\n", - " 2: 0.7248062015503876,\n", - " 3: 0.9138613861386139,\n", - " 4: 0.8411405295315683,\n", - " 5: 0.5269058295964125,\n", - " 6: 0.9248434237995825,\n", - " 7: 0.8735408560311284,\n", - " 8: 0.7515400410677618,\n", - " 9: 0.8364717542120912,\n", - " 'phase': 'baseline'},\n", - " {0: 0.9612244897959183,\n", - " 
1: 0.9559471365638766,\n", - " 2: 0.7897286821705426,\n", - " 3: 0.9,\n", - " 4: 0.8594704684317719,\n", - " 5: 0.6412556053811659,\n", - " 6: 0.9196242171189979,\n", - " 7: 0.8706225680933852,\n", - " 8: 0.7936344969199178,\n", - " 9: 0.8533201189296333,\n", - " 'phase': 'baseline'},\n", - " {0: 0.9663265306122449,\n", - " 1: 0.9665198237885463,\n", - " 2: 0.813953488372093,\n", - " 3: 0.902970297029703,\n", - " 4: 0.8676171079429735,\n", - " 5: 0.6748878923766816,\n", - " 6: 0.9175365344467641,\n", - " 7: 0.8793774319066148,\n", - " 8: 0.7905544147843943,\n", - " 9: 0.8582755203171457,\n", - " 'phase': 'baseline'},\n", - " {0: 0.9683673469387755,\n", - " 1: 0.9647577092511013,\n", - " 2: 0.814922480620155,\n", - " 3: 0.9,\n", - " 4: 0.8767820773930753,\n", - " 5: 0.7062780269058296,\n", - " 6: 0.9196242171189979,\n", - " 7: 0.8813229571984436,\n", - " 8: 0.8193018480492813,\n", - " 9: 0.8612487611496531,\n", - " 'phase': 'baseline'}]" - ] - }, - "metadata": {}, - "execution_count": 14 - } - ] + "execution_count": 18, + "outputs": [] }, { "cell_type": "code", @@ -1096,41 +492,41 @@ "history_catastrophic_forgetting" ], "metadata": { + "id": "OnATcaveP3Fi", "colab": { "base_uri": "https://localhost:8080/" }, - "id": "OnATcaveP3Fi", - "outputId": "3864a59d-b604-491d-8697-f4f7d622c1e7" + "outputId": "6e9bc36f-8e10-405a-8297-e104141e58cc" }, - "execution_count": 15, + "execution_count": 19, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ - "Train Epoch: 1 [0/12665 (0%)]\tLoss: 2.311233\n", - "Train Epoch: 1 [640/12665 (5%)]\tLoss: 2.246531\n", - "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 2.186137\n", - "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 2.105181\n", - "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 2.048626\n", - "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 1.975536\n", - "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 1.913516\n", - "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 1.818088\n", - "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 1.744223\n", - "Train 
Epoch: 1 [5760/12665 (45%)]\tLoss: 1.696749\n", - "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 1.615581\n", - "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 1.508412\n", - "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 1.426383\n", - "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 1.385702\n", - "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 1.271088\n", - "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 1.157527\n", - "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 1.164531\n", - "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 1.056471\n", - "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 1.015163\n", - "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.924486\n", - "\n", - "Test set: Average loss: 2.6919\n", - "Class 0 accuracy: 972.0/980(99%)\n", + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 2.295613\n", + "Train Epoch: 1 [640/12665 (5%)]\tLoss: 1.647854\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 1.039609\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 0.593714\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 0.321345\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 0.211062\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 0.124204\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 0.082856\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 0.075962\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 0.071156\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 0.117059\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 0.059726\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.032035\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.033078\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.030728\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.039060\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.035301\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.041941\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.040506\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.014235\n", + "\n", + "Test set: Average loss: 7.1276\n", + "Class 0 accuracy: 977.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 
0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -1140,29 +536,29 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.725303\n", - "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.845168\n", - "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.872068\n", - "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.699184\n", - "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.702631\n", - "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.649261\n", - "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.638805\n", - "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.584503\n", - "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.612078\n", - "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.522527\n", - "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.505232\n", - "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.500317\n", - "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.420275\n", - "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.444307\n", - "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.431154\n", - "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.426933\n", - "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.428767\n", - "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.397589\n", - "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.332724\n", - "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.391286\n", - "\n", - "Test set: Average loss: 3.6493\n", - "Class 0 accuracy: 970.0/980(99%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.007759\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.029978\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.017544\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.022188\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.009434\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.024381\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.086738\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.020443\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.015766\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.006633\n", + "Train Epoch: 2 
[6400/12665 (51%)]\tLoss: 0.007944\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.008917\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.004392\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.008756\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.056707\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.005973\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.008020\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.009416\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.017660\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.010692\n", + "\n", + "Test set: Average loss: 8.1468\n", + "Class 0 accuracy: 977.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -1172,29 +568,29 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.367619\n", - "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.309399\n", - "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.296202\n", - "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.340773\n", - "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.293039\n", - "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.288575\n", - "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.285356\n", - "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.283475\n", - "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.285720\n", - "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.245976\n", - "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.249808\n", - "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.239022\n", - "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.268774\n", - "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.223297\n", - "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.236870\n", - "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.222967\n", - "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.242883\n", - "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.208523\n", - "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.191585\n", - "Train Epoch: 3 [12160/12665 
(96%)]\tLoss: 0.206234\n", - "\n", - "Test set: Average loss: 4.2921\n", - "Class 0 accuracy: 971.0/980(99%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.016127\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.018997\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.004281\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.004884\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.006038\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.012006\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.009289\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.002473\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.002702\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.012154\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.018935\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.004237\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.003406\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.008378\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.003461\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.018804\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.015821\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.003116\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.002931\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.004047\n", + "\n", + "Test set: Average loss: 8.5887\n", + "Class 0 accuracy: 977.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -1204,493 +600,243 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.222183\n", - "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.175392\n", - "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.230008\n", - "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.246189\n", - "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.224284\n", - "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.172705\n", - "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.188962\n", - "Train Epoch: 4 
[4480/12665 (35%)]\tLoss: 0.212664\n", - "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.197847\n", - "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.161129\n", - "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.160840\n", - "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.193788\n", - "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.150140\n", - "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.193050\n", - "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.173765\n", - "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.170651\n", - "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.170728\n", - "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.179045\n", - "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.156496\n", - "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.174930\n", - "\n", - "Test set: Average loss: 4.6719\n", - "Class 0 accuracy: 972.0/980(99%)\n", - "Class 1 accuracy: 1134.0/1135(100%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.150109\n", - "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.133148\n", - "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.143406\n", - "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.210281\n", - "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.129901\n", - "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.140156\n", - "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.127928\n", - "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.153185\n", - "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.132688\n", - "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.174982\n", - "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.174245\n", - "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.147878\n", - "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.105936\n", - "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.139824\n", - "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 
0.128497\n", - "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.102555\n", - "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.149713\n", - "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.204445\n", - "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.173781\n", - "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.104449\n", - "\n", - "Test set: Average loss: 4.9040\n", - "Class 0 accuracy: 972.0/980(99%)\n", - "Class 1 accuracy: 1134.0/1135(100%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/12089 (0%)]\tLoss: 7.002198\n", - "Train Epoch: 1 [640/12089 (5%)]\tLoss: 6.786501\n", - "Train Epoch: 1 [1280/12089 (11%)]\tLoss: 6.051014\n", - "Train Epoch: 1 [1920/12089 (16%)]\tLoss: 6.422165\n", - "Train Epoch: 1 [2560/12089 (21%)]\tLoss: 5.702563\n", - "Train Epoch: 1 [3200/12089 (26%)]\tLoss: 5.380751\n", - "Train Epoch: 1 [3840/12089 (32%)]\tLoss: 4.846919\n", - "Train Epoch: 1 [4480/12089 (37%)]\tLoss: 4.511275\n", - "Train Epoch: 1 [5120/12089 (42%)]\tLoss: 4.290347\n", - "Train Epoch: 1 [5760/12089 (48%)]\tLoss: 3.839983\n", - "Train Epoch: 1 [6400/12089 (53%)]\tLoss: 3.078847\n", - "Train Epoch: 1 [7040/12089 (58%)]\tLoss: 2.839584\n", - "Train Epoch: 1 [7680/12089 (63%)]\tLoss: 2.448348\n", - "Train Epoch: 1 [8320/12089 (69%)]\tLoss: 2.193519\n", - "Train Epoch: 1 [8960/12089 (74%)]\tLoss: 1.988640\n", - "Train Epoch: 1 [9600/12089 (79%)]\tLoss: 1.651685\n", - "Train Epoch: 1 [10240/12089 (85%)]\tLoss: 1.662965\n", - "Train Epoch: 1 [10880/12089 (90%)]\tLoss: 1.390365\n", - "Train Epoch: 1 [11520/12089 (95%)]\tLoss: 1.214716\n", - "\n", - "Test set: Average loss: 2.9396\n", - "Class 0 accuracy: 554.0/980(57%)\n", - "Class 1 accuracy: 1033.0/1135(91%)\n", - "Class 2 accuracy: 387.0/1032(38%)\n", - "Class 3 
accuracy: 1008.0/1010(100%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/12089 (0%)]\tLoss: 1.242918\n", - "Train Epoch: 2 [640/12089 (5%)]\tLoss: 1.003339\n", - "Train Epoch: 2 [1280/12089 (11%)]\tLoss: 0.984789\n", - "Train Epoch: 2 [1920/12089 (16%)]\tLoss: 0.937961\n", - "Train Epoch: 2 [2560/12089 (21%)]\tLoss: 0.883540\n", - "Train Epoch: 2 [3200/12089 (26%)]\tLoss: 0.840368\n", - "Train Epoch: 2 [3840/12089 (32%)]\tLoss: 0.937714\n", - "Train Epoch: 2 [4480/12089 (37%)]\tLoss: 0.909657\n", - "Train Epoch: 2 [5120/12089 (42%)]\tLoss: 0.840488\n", - "Train Epoch: 2 [5760/12089 (48%)]\tLoss: 0.763511\n", - "Train Epoch: 2 [6400/12089 (53%)]\tLoss: 0.767492\n", - "Train Epoch: 2 [7040/12089 (58%)]\tLoss: 0.721862\n", - "Train Epoch: 2 [7680/12089 (63%)]\tLoss: 0.698475\n", - "Train Epoch: 2 [8320/12089 (69%)]\tLoss: 0.630833\n", - "Train Epoch: 2 [8960/12089 (74%)]\tLoss: 0.732636\n", - "Train Epoch: 2 [9600/12089 (79%)]\tLoss: 0.686765\n", - "Train Epoch: 2 [10240/12089 (85%)]\tLoss: 0.647560\n", - "Train Epoch: 2 [10880/12089 (90%)]\tLoss: 0.584798\n", - "Train Epoch: 2 [11520/12089 (95%)]\tLoss: 0.605022\n", - "\n", - "Test set: Average loss: 3.8344\n", + "Train Epoch: 1 [0/12089 (0%)]\tLoss: 10.857133\n", + "Train Epoch: 1 [640/12089 (5%)]\tLoss: 6.280286\n", + "Train Epoch: 1 [1280/12089 (11%)]\tLoss: 2.301530\n", + "Train Epoch: 1 [1920/12089 (16%)]\tLoss: 0.905669\n", + "Train Epoch: 1 [2560/12089 (21%)]\tLoss: 0.688727\n", + "Train Epoch: 1 [3200/12089 (26%)]\tLoss: 0.598405\n", + "Train Epoch: 1 [3840/12089 (32%)]\tLoss: 0.462726\n", + "Train Epoch: 1 [4480/12089 (37%)]\tLoss: 0.345897\n", + "Train Epoch: 1 [5120/12089 (42%)]\tLoss: 0.380626\n", + "Train Epoch: 1 [5760/12089 (48%)]\tLoss: 0.280428\n", + "Train Epoch: 1 [6400/12089 (53%)]\tLoss: 
0.216660\n", + "Train Epoch: 1 [7040/12089 (58%)]\tLoss: 0.167003\n", + "Train Epoch: 1 [7680/12089 (63%)]\tLoss: 0.275916\n", + "Train Epoch: 1 [8320/12089 (69%)]\tLoss: 0.326823\n", + "Train Epoch: 1 [8960/12089 (74%)]\tLoss: 0.258519\n", + "Train Epoch: 1 [9600/12089 (79%)]\tLoss: 0.233105\n", + "Train Epoch: 1 [10240/12089 (85%)]\tLoss: 0.235713\n", + "Train Epoch: 1 [10880/12089 (90%)]\tLoss: 0.265890\n", + "Train Epoch: 1 [11520/12089 (95%)]\tLoss: 0.262226\n", + "\n", + "Test set: Average loss: 6.2382\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 889.0/1032(86%)\n", - "Class 3 accuracy: 985.0/1010(98%)\n", + "Class 2 accuracy: 992.0/1032(96%)\n", + "Class 3 accuracy: 987.0/1010(98%)\n", "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12089 (0%)]\tLoss: 0.633021\n", - "Train Epoch: 3 [640/12089 (5%)]\tLoss: 0.661086\n", - "Train Epoch: 3 [1280/12089 (11%)]\tLoss: 0.531795\n", - "Train Epoch: 3 [1920/12089 (16%)]\tLoss: 0.595388\n", - "Train Epoch: 3 [2560/12089 (21%)]\tLoss: 0.484488\n", - "Train Epoch: 3 [3200/12089 (26%)]\tLoss: 0.610725\n", - "Train Epoch: 3 [3840/12089 (32%)]\tLoss: 0.539676\n", - "Train Epoch: 3 [4480/12089 (37%)]\tLoss: 0.555348\n", - "Train Epoch: 3 [5120/12089 (42%)]\tLoss: 0.475156\n", - "Train Epoch: 3 [5760/12089 (48%)]\tLoss: 0.532515\n", - "Train Epoch: 3 [6400/12089 (53%)]\tLoss: 0.561437\n", - "Train Epoch: 3 [7040/12089 (58%)]\tLoss: 0.513701\n", - "Train Epoch: 3 [7680/12089 (63%)]\tLoss: 0.469366\n", - "Train Epoch: 3 [8320/12089 (69%)]\tLoss: 0.517332\n", - "Train Epoch: 3 [8960/12089 (74%)]\tLoss: 0.443565\n", - "Train Epoch: 3 [9600/12089 (79%)]\tLoss: 0.427636\n", - "Train Epoch: 3 [10240/12089 (85%)]\tLoss: 0.427255\n", - "Train Epoch: 3 [10880/12089 (90%)]\tLoss: 0.556653\n", - "Train 
Epoch: 3 [11520/12089 (95%)]\tLoss: 0.481399\n", - "\n", - "Test set: Average loss: 4.3145\n", + "Train Epoch: 2 [0/12089 (0%)]\tLoss: 0.099378\n", + "Train Epoch: 2 [640/12089 (5%)]\tLoss: 0.116401\n", + "Train Epoch: 2 [1280/12089 (11%)]\tLoss: 0.155221\n", + "Train Epoch: 2 [1920/12089 (16%)]\tLoss: 0.109446\n", + "Train Epoch: 2 [2560/12089 (21%)]\tLoss: 0.104514\n", + "Train Epoch: 2 [3200/12089 (26%)]\tLoss: 0.219575\n", + "Train Epoch: 2 [3840/12089 (32%)]\tLoss: 0.151700\n", + "Train Epoch: 2 [4480/12089 (37%)]\tLoss: 0.162770\n", + "Train Epoch: 2 [5120/12089 (42%)]\tLoss: 0.152628\n", + "Train Epoch: 2 [5760/12089 (48%)]\tLoss: 0.186006\n", + "Train Epoch: 2 [6400/12089 (53%)]\tLoss: 0.095261\n", + "Train Epoch: 2 [7040/12089 (58%)]\tLoss: 0.152865\n", + "Train Epoch: 2 [7680/12089 (63%)]\tLoss: 0.046197\n", + "Train Epoch: 2 [8320/12089 (69%)]\tLoss: 0.068629\n", + "Train Epoch: 2 [8960/12089 (74%)]\tLoss: 0.133037\n", + "Train Epoch: 2 [9600/12089 (79%)]\tLoss: 0.106119\n", + "Train Epoch: 2 [10240/12089 (85%)]\tLoss: 0.073823\n", + "Train Epoch: 2 [10880/12089 (90%)]\tLoss: 0.117314\n", + "Train Epoch: 2 [11520/12089 (95%)]\tLoss: 0.144778\n", + "\n", + "Test set: Average loss: 7.2467\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 945.0/1032(92%)\n", - "Class 3 accuracy: 967.0/1010(96%)\n", + "Class 2 accuracy: 998.0/1032(97%)\n", + "Class 3 accuracy: 994.0/1010(98%)\n", "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12089 (0%)]\tLoss: 0.505337\n", - "Train Epoch: 4 [640/12089 (5%)]\tLoss: 0.464085\n", - "Train Epoch: 4 [1280/12089 (11%)]\tLoss: 0.518291\n", - "Train Epoch: 4 [1920/12089 (16%)]\tLoss: 0.452366\n", - "Train Epoch: 4 [2560/12089 (21%)]\tLoss: 0.405918\n", - "Train Epoch: 4 [3200/12089 (26%)]\tLoss: 
0.502257\n", - "Train Epoch: 4 [3840/12089 (32%)]\tLoss: 0.448973\n", - "Train Epoch: 4 [4480/12089 (37%)]\tLoss: 0.445046\n", - "Train Epoch: 4 [5120/12089 (42%)]\tLoss: 0.495061\n", - "Train Epoch: 4 [5760/12089 (48%)]\tLoss: 0.456786\n", - "Train Epoch: 4 [6400/12089 (53%)]\tLoss: 0.371738\n", - "Train Epoch: 4 [7040/12089 (58%)]\tLoss: 0.468638\n", - "Train Epoch: 4 [7680/12089 (63%)]\tLoss: 0.495899\n", - "Train Epoch: 4 [8320/12089 (69%)]\tLoss: 0.453645\n", - "Train Epoch: 4 [8960/12089 (74%)]\tLoss: 0.479238\n", - "Train Epoch: 4 [9600/12089 (79%)]\tLoss: 0.458163\n", - "Train Epoch: 4 [10240/12089 (85%)]\tLoss: 0.446410\n", - "Train Epoch: 4 [10880/12089 (90%)]\tLoss: 0.441910\n", - "Train Epoch: 4 [11520/12089 (95%)]\tLoss: 0.430284\n", - "\n", - "Test set: Average loss: 4.5708\n", + "Train Epoch: 3 [0/12089 (0%)]\tLoss: 0.102792\n", + "Train Epoch: 3 [640/12089 (5%)]\tLoss: 0.209812\n", + "Train Epoch: 3 [1280/12089 (11%)]\tLoss: 0.079453\n", + "Train Epoch: 3 [1920/12089 (16%)]\tLoss: 0.146311\n", + "Train Epoch: 3 [2560/12089 (21%)]\tLoss: 0.057011\n", + "Train Epoch: 3 [3200/12089 (26%)]\tLoss: 0.062497\n", + "Train Epoch: 3 [3840/12089 (32%)]\tLoss: 0.114005\n", + "Train Epoch: 3 [4480/12089 (37%)]\tLoss: 0.089880\n", + "Train Epoch: 3 [5120/12089 (42%)]\tLoss: 0.057159\n", + "Train Epoch: 3 [5760/12089 (48%)]\tLoss: 0.117361\n", + "Train Epoch: 3 [6400/12089 (53%)]\tLoss: 0.098925\n", + "Train Epoch: 3 [7040/12089 (58%)]\tLoss: 0.069072\n", + "Train Epoch: 3 [7680/12089 (63%)]\tLoss: 0.111345\n", + "Train Epoch: 3 [8320/12089 (69%)]\tLoss: 0.131783\n", + "Train Epoch: 3 [8960/12089 (74%)]\tLoss: 0.150885\n", + "Train Epoch: 3 [9600/12089 (79%)]\tLoss: 0.079096\n", + "Train Epoch: 3 [10240/12089 (85%)]\tLoss: 0.082054\n", + "Train Epoch: 3 [10880/12089 (90%)]\tLoss: 0.129982\n", + "Train Epoch: 3 [11520/12089 (95%)]\tLoss: 0.066340\n", + "\n", + "Test set: Average loss: 7.6576\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", 
- "Class 2 accuracy: 952.0/1032(92%)\n", - "Class 3 accuracy: 969.0/1010(96%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12089 (0%)]\tLoss: 0.405303\n", - "Train Epoch: 5 [640/12089 (5%)]\tLoss: 0.396980\n", - "Train Epoch: 5 [1280/12089 (11%)]\tLoss: 0.421218\n", - "Train Epoch: 5 [1920/12089 (16%)]\tLoss: 0.459768\n", - "Train Epoch: 5 [2560/12089 (21%)]\tLoss: 0.354826\n", - "Train Epoch: 5 [3200/12089 (26%)]\tLoss: 0.372944\n", - "Train Epoch: 5 [3840/12089 (32%)]\tLoss: 0.394097\n", - "Train Epoch: 5 [4480/12089 (37%)]\tLoss: 0.444731\n", - "Train Epoch: 5 [5120/12089 (42%)]\tLoss: 0.470775\n", - "Train Epoch: 5 [5760/12089 (48%)]\tLoss: 0.414834\n", - "Train Epoch: 5 [6400/12089 (53%)]\tLoss: 0.451856\n", - "Train Epoch: 5 [7040/12089 (58%)]\tLoss: 0.390931\n", - "Train Epoch: 5 [7680/12089 (63%)]\tLoss: 0.392495\n", - "Train Epoch: 5 [8320/12089 (69%)]\tLoss: 0.341354\n", - "Train Epoch: 5 [8960/12089 (74%)]\tLoss: 0.355052\n", - "Train Epoch: 5 [9600/12089 (79%)]\tLoss: 0.414375\n", - "Train Epoch: 5 [10240/12089 (85%)]\tLoss: 0.419718\n", - "Train Epoch: 5 [10880/12089 (90%)]\tLoss: 0.367832\n", - "Train Epoch: 5 [11520/12089 (95%)]\tLoss: 0.358470\n", - "\n", - "Test set: Average loss: 4.7194\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 953.0/1032(92%)\n", - "Class 3 accuracy: 970.0/1010(96%)\n", + "Class 2 accuracy: 1007.0/1032(98%)\n", + "Class 3 accuracy: 985.0/1010(98%)\n", "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/11263 (0%)]\tLoss: 6.261249\n", - "Train Epoch: 1 [640/11263 (6%)]\tLoss: 5.999681\n", - 
"Train Epoch: 1 [1280/11263 (11%)]\tLoss: 5.607321\n", - "Train Epoch: 1 [1920/11263 (17%)]\tLoss: 5.542882\n", - "Train Epoch: 1 [2560/11263 (23%)]\tLoss: 4.963273\n", - "Train Epoch: 1 [3200/11263 (28%)]\tLoss: 4.750457\n", - "Train Epoch: 1 [3840/11263 (34%)]\tLoss: 4.334918\n", - "Train Epoch: 1 [4480/11263 (40%)]\tLoss: 3.912877\n", - "Train Epoch: 1 [5120/11263 (45%)]\tLoss: 3.827431\n", - "Train Epoch: 1 [5760/11263 (51%)]\tLoss: 3.393839\n", - "Train Epoch: 1 [6400/11263 (57%)]\tLoss: 3.033727\n", - "Train Epoch: 1 [7040/11263 (62%)]\tLoss: 2.671916\n", - "Train Epoch: 1 [7680/11263 (68%)]\tLoss: 2.473807\n", - "Train Epoch: 1 [8320/11263 (74%)]\tLoss: 2.285081\n", - "Train Epoch: 1 [8960/11263 (80%)]\tLoss: 1.972579\n", - "Train Epoch: 1 [9600/11263 (85%)]\tLoss: 1.953343\n", - "Train Epoch: 1 [10240/11263 (91%)]\tLoss: 1.653112\n", - "Train Epoch: 1 [10880/11263 (97%)]\tLoss: 1.666049\n", - "\n", - "Test set: Average loss: 2.6135\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 242.0/1135(21%)\n", - "Class 2 accuracy: 341.0/1032(33%)\n", - "Class 3 accuracy: 431.0/1010(43%)\n", - "Class 4 accuracy: 982.0/982(100%)\n", - "Class 5 accuracy: 11.0/892(1%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/11263 (0%)]\tLoss: 1.265681\n", - "Train Epoch: 2 [640/11263 (6%)]\tLoss: 1.242094\n", - "Train Epoch: 2 [1280/11263 (11%)]\tLoss: 1.308110\n", - "Train Epoch: 2 [1920/11263 (17%)]\tLoss: 1.304853\n", - "Train Epoch: 2 [2560/11263 (23%)]\tLoss: 1.242684\n", - "Train Epoch: 2 [3200/11263 (28%)]\tLoss: 1.155575\n", - "Train Epoch: 2 [3840/11263 (34%)]\tLoss: 1.025319\n", - "Train Epoch: 2 [4480/11263 (40%)]\tLoss: 1.151237\n", - "Train Epoch: 2 [5120/11263 (45%)]\tLoss: 1.071076\n", - "Train Epoch: 2 [5760/11263 (51%)]\tLoss: 0.978908\n", - "Train Epoch: 2 [6400/11263 (57%)]\tLoss: 0.869457\n", - "Train Epoch: 2 [7040/11263 
(62%)]\tLoss: 0.841398\n", - "Train Epoch: 2 [7680/11263 (68%)]\tLoss: 0.893406\n", - "Train Epoch: 2 [8320/11263 (74%)]\tLoss: 0.835585\n", - "Train Epoch: 2 [8960/11263 (80%)]\tLoss: 0.868128\n", - "Train Epoch: 2 [9600/11263 (85%)]\tLoss: 0.763401\n", - "Train Epoch: 2 [10240/11263 (91%)]\tLoss: 0.905359\n", - "Train Epoch: 2 [10880/11263 (97%)]\tLoss: 0.842730\n", - "\n", - "Test set: Average loss: 3.4385\n", + "Train Epoch: 1 [0/11263 (0%)]\tLoss: 10.835564\n", + "Train Epoch: 1 [640/11263 (6%)]\tLoss: 5.729345\n", + "Train Epoch: 1 [1280/11263 (11%)]\tLoss: 2.635014\n", + "Train Epoch: 1 [1920/11263 (17%)]\tLoss: 1.219099\n", + "Train Epoch: 1 [2560/11263 (23%)]\tLoss: 0.913658\n", + "Train Epoch: 1 [3200/11263 (28%)]\tLoss: 0.655098\n", + "Train Epoch: 1 [3840/11263 (34%)]\tLoss: 0.466011\n", + "Train Epoch: 1 [4480/11263 (40%)]\tLoss: 0.539344\n", + "Train Epoch: 1 [5120/11263 (45%)]\tLoss: 0.249651\n", + "Train Epoch: 1 [5760/11263 (51%)]\tLoss: 0.209131\n", + "Train Epoch: 1 [6400/11263 (57%)]\tLoss: 0.223062\n", + "Train Epoch: 1 [7040/11263 (62%)]\tLoss: 0.228752\n", + "Train Epoch: 1 [7680/11263 (68%)]\tLoss: 0.198413\n", + "Train Epoch: 1 [8320/11263 (74%)]\tLoss: 0.215570\n", + "Train Epoch: 1 [8960/11263 (80%)]\tLoss: 0.272983\n", + "Train Epoch: 1 [9600/11263 (85%)]\tLoss: 0.155609\n", + "Train Epoch: 1 [10240/11263 (91%)]\tLoss: 0.087590\n", + "Train Epoch: 1 [10880/11263 (97%)]\tLoss: 0.132957\n", + "\n", + "Test set: Average loss: 7.1306\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 979.0/982(100%)\n", - "Class 5 accuracy: 808.0/892(91%)\n", + "Class 4 accuracy: 977.0/982(99%)\n", + "Class 5 accuracy: 866.0/892(97%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/11263 (0%)]\tLoss: 0.688606\n", - "Train 
Epoch: 3 [640/11263 (6%)]\tLoss: 0.747074\n", - "Train Epoch: 3 [1280/11263 (11%)]\tLoss: 0.699562\n", - "Train Epoch: 3 [1920/11263 (17%)]\tLoss: 0.687192\n", - "Train Epoch: 3 [2560/11263 (23%)]\tLoss: 0.694984\n", - "Train Epoch: 3 [3200/11263 (28%)]\tLoss: 0.643804\n", - "Train Epoch: 3 [3840/11263 (34%)]\tLoss: 0.637270\n", - "Train Epoch: 3 [4480/11263 (40%)]\tLoss: 0.776547\n", - "Train Epoch: 3 [5120/11263 (45%)]\tLoss: 0.624326\n", - "Train Epoch: 3 [5760/11263 (51%)]\tLoss: 0.763693\n", - "Train Epoch: 3 [6400/11263 (57%)]\tLoss: 0.619411\n", - "Train Epoch: 3 [7040/11263 (62%)]\tLoss: 0.672091\n", - "Train Epoch: 3 [7680/11263 (68%)]\tLoss: 0.640160\n", - "Train Epoch: 3 [8320/11263 (74%)]\tLoss: 0.594804\n", - "Train Epoch: 3 [8960/11263 (80%)]\tLoss: 0.712096\n", - "Train Epoch: 3 [9600/11263 (85%)]\tLoss: 0.584561\n", - "Train Epoch: 3 [10240/11263 (91%)]\tLoss: 0.490905\n", - "Train Epoch: 3 [10880/11263 (97%)]\tLoss: 0.511629\n", - "\n", - "Test set: Average loss: 3.9981\n", + "Train Epoch: 2 [0/11263 (0%)]\tLoss: 0.130704\n", + "Train Epoch: 2 [640/11263 (6%)]\tLoss: 0.123305\n", + "Train Epoch: 2 [1280/11263 (11%)]\tLoss: 0.092606\n", + "Train Epoch: 2 [1920/11263 (17%)]\tLoss: 0.108018\n", + "Train Epoch: 2 [2560/11263 (23%)]\tLoss: 0.059542\n", + "Train Epoch: 2 [3200/11263 (28%)]\tLoss: 0.051525\n", + "Train Epoch: 2 [3840/11263 (34%)]\tLoss: 0.105634\n", + "Train Epoch: 2 [4480/11263 (40%)]\tLoss: 0.075492\n", + "Train Epoch: 2 [5120/11263 (45%)]\tLoss: 0.056117\n", + "Train Epoch: 2 [5760/11263 (51%)]\tLoss: 0.119122\n", + "Train Epoch: 2 [6400/11263 (57%)]\tLoss: 0.098337\n", + "Train Epoch: 2 [7040/11263 (62%)]\tLoss: 0.049512\n", + "Train Epoch: 2 [7680/11263 (68%)]\tLoss: 0.070381\n", + "Train Epoch: 2 [8320/11263 (74%)]\tLoss: 0.070122\n", + "Train Epoch: 2 [8960/11263 (80%)]\tLoss: 0.074574\n", + "Train Epoch: 2 [9600/11263 (85%)]\tLoss: 0.085832\n", + "Train Epoch: 2 [10240/11263 (91%)]\tLoss: 0.194243\n", + "Train Epoch: 2 
[10880/11263 (97%)]\tLoss: 0.052719\n", + "\n", + "Test set: Average loss: 8.4438\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 975.0/982(99%)\n", - "Class 5 accuracy: 837.0/892(94%)\n", + "Class 4 accuracy: 978.0/982(100%)\n", + "Class 5 accuracy: 872.0/892(98%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/11263 (0%)]\tLoss: 0.560350\n", - "Train Epoch: 4 [640/11263 (6%)]\tLoss: 0.549644\n", - "Train Epoch: 4 [1280/11263 (11%)]\tLoss: 0.548100\n", - "Train Epoch: 4 [1920/11263 (17%)]\tLoss: 0.523234\n", - "Train Epoch: 4 [2560/11263 (23%)]\tLoss: 0.563891\n", - "Train Epoch: 4 [3200/11263 (28%)]\tLoss: 0.462694\n", - "Train Epoch: 4 [3840/11263 (34%)]\tLoss: 0.562608\n", - "Train Epoch: 4 [4480/11263 (40%)]\tLoss: 0.446004\n", - "Train Epoch: 4 [5120/11263 (45%)]\tLoss: 0.511273\n", - "Train Epoch: 4 [5760/11263 (51%)]\tLoss: 0.548768\n", - "Train Epoch: 4 [6400/11263 (57%)]\tLoss: 0.529422\n", - "Train Epoch: 4 [7040/11263 (62%)]\tLoss: 0.544079\n", - "Train Epoch: 4 [7680/11263 (68%)]\tLoss: 0.428724\n", - "Train Epoch: 4 [8320/11263 (74%)]\tLoss: 0.600822\n", - "Train Epoch: 4 [8960/11263 (80%)]\tLoss: 0.474362\n", - "Train Epoch: 4 [9600/11263 (85%)]\tLoss: 0.595750\n", - "Train Epoch: 4 [10240/11263 (91%)]\tLoss: 0.544630\n", - "Train Epoch: 4 [10880/11263 (97%)]\tLoss: 0.506346\n", - "\n", - "Test set: Average loss: 4.3219\n", + "Train Epoch: 3 [0/11263 (0%)]\tLoss: 0.031168\n", + "Train Epoch: 3 [640/11263 (6%)]\tLoss: 0.133256\n", + "Train Epoch: 3 [1280/11263 (11%)]\tLoss: 0.064342\n", + "Train Epoch: 3 [1920/11263 (17%)]\tLoss: 0.081790\n", + "Train Epoch: 3 [2560/11263 (23%)]\tLoss: 0.055577\n", + "Train Epoch: 3 [3200/11263 (28%)]\tLoss: 0.031944\n", + "Train Epoch: 3 [3840/11263 (34%)]\tLoss: 0.079894\n", + 
"Train Epoch: 3 [4480/11263 (40%)]\tLoss: 0.054432\n", + "Train Epoch: 3 [5120/11263 (45%)]\tLoss: 0.032932\n", + "Train Epoch: 3 [5760/11263 (51%)]\tLoss: 0.054515\n", + "Train Epoch: 3 [6400/11263 (57%)]\tLoss: 0.015534\n", + "Train Epoch: 3 [7040/11263 (62%)]\tLoss: 0.073943\n", + "Train Epoch: 3 [7680/11263 (68%)]\tLoss: 0.051291\n", + "Train Epoch: 3 [8320/11263 (74%)]\tLoss: 0.071271\n", + "Train Epoch: 3 [8960/11263 (80%)]\tLoss: 0.078468\n", + "Train Epoch: 3 [9600/11263 (85%)]\tLoss: 0.074505\n", + "Train Epoch: 3 [10240/11263 (91%)]\tLoss: 0.041854\n", + "Train Epoch: 3 [10880/11263 (97%)]\tLoss: 0.051243\n", + "\n", + "Test set: Average loss: 9.0650\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 974.0/982(99%)\n", - "Class 5 accuracy: 841.0/892(94%)\n", + "Class 4 accuracy: 978.0/982(100%)\n", + "Class 5 accuracy: 879.0/892(99%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/11263 (0%)]\tLoss: 0.355252\n", - "Train Epoch: 5 [640/11263 (6%)]\tLoss: 0.517941\n", - "Train Epoch: 5 [1280/11263 (11%)]\tLoss: 0.526465\n", - "Train Epoch: 5 [1920/11263 (17%)]\tLoss: 0.523074\n", - "Train Epoch: 5 [2560/11263 (23%)]\tLoss: 0.433639\n", - "Train Epoch: 5 [3200/11263 (28%)]\tLoss: 0.434077\n", - "Train Epoch: 5 [3840/11263 (34%)]\tLoss: 0.403323\n", - "Train Epoch: 5 [4480/11263 (40%)]\tLoss: 0.505131\n", - "Train Epoch: 5 [5120/11263 (45%)]\tLoss: 0.355989\n", - "Train Epoch: 5 [5760/11263 (51%)]\tLoss: 0.490564\n", - "Train Epoch: 5 [6400/11263 (57%)]\tLoss: 0.399952\n", - "Train Epoch: 5 [7040/11263 (62%)]\tLoss: 0.436878\n", - "Train Epoch: 5 [7680/11263 (68%)]\tLoss: 0.491910\n", - "Train Epoch: 5 [8320/11263 (74%)]\tLoss: 0.429957\n", - "Train Epoch: 5 [8960/11263 (80%)]\tLoss: 0.495502\n", - "Train Epoch: 5 [9600/11263 
(85%)]\tLoss: 0.446051\n", - "Train Epoch: 5 [10240/11263 (91%)]\tLoss: 0.364511\n", - "Train Epoch: 5 [10880/11263 (97%)]\tLoss: 0.447680\n", - "\n", - "Test set: Average loss: 4.5150\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 974.0/982(99%)\n", - "Class 5 accuracy: 843.0/892(95%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/12183 (0%)]\tLoss: 7.209232\n", - "Train Epoch: 1 [640/12183 (5%)]\tLoss: 7.299924\n", - "Train Epoch: 1 [1280/12183 (10%)]\tLoss: 6.381386\n", - "Train Epoch: 1 [1920/12183 (16%)]\tLoss: 6.263927\n", - "Train Epoch: 1 [2560/12183 (21%)]\tLoss: 5.731481\n", - "Train Epoch: 1 [3200/12183 (26%)]\tLoss: 5.564906\n", - "Train Epoch: 1 [3840/12183 (31%)]\tLoss: 4.826056\n", - "Train Epoch: 1 [4480/12183 (37%)]\tLoss: 4.433992\n", - "Train Epoch: 1 [5120/12183 (42%)]\tLoss: 4.331242\n", - "Train Epoch: 1 [5760/12183 (47%)]\tLoss: 3.656218\n", - "Train Epoch: 1 [6400/12183 (52%)]\tLoss: 3.236688\n", - "Train Epoch: 1 [7040/12183 (58%)]\tLoss: 2.764972\n", - "Train Epoch: 1 [7680/12183 (63%)]\tLoss: 2.587098\n", - "Train Epoch: 1 [8320/12183 (68%)]\tLoss: 2.090186\n", - "Train Epoch: 1 [8960/12183 (73%)]\tLoss: 2.049698\n", - "Train Epoch: 1 [9600/12183 (79%)]\tLoss: 1.641774\n", - "Train Epoch: 1 [10240/12183 (84%)]\tLoss: 1.447641\n", - "Train Epoch: 1 [10880/12183 (89%)]\tLoss: 1.294460\n", - "Train Epoch: 1 [11520/12183 (94%)]\tLoss: 1.226808\n", - "Train Epoch: 1 [4370/12183 (99%)]\tLoss: 0.847535\n", - "\n", - "Test set: Average loss: 2.5262\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 1.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 
957.0/958(100%)\n", - "Class 7 accuracy: 795.0/1028(77%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/12183 (0%)]\tLoss: 1.063643\n", - "Train Epoch: 2 [640/12183 (5%)]\tLoss: 0.945048\n", - "Train Epoch: 2 [1280/12183 (10%)]\tLoss: 0.910895\n", - "Train Epoch: 2 [1920/12183 (16%)]\tLoss: 0.803437\n", - "Train Epoch: 2 [2560/12183 (21%)]\tLoss: 0.714711\n", - "Train Epoch: 2 [3200/12183 (26%)]\tLoss: 0.731389\n", - "Train Epoch: 2 [3840/12183 (31%)]\tLoss: 0.697865\n", - "Train Epoch: 2 [4480/12183 (37%)]\tLoss: 0.518302\n", - "Train Epoch: 2 [5120/12183 (42%)]\tLoss: 0.506918\n", - "Train Epoch: 2 [5760/12183 (47%)]\tLoss: 0.638351\n", - "Train Epoch: 2 [6400/12183 (52%)]\tLoss: 0.607182\n", - "Train Epoch: 2 [7040/12183 (58%)]\tLoss: 0.582088\n", - "Train Epoch: 2 [7680/12183 (63%)]\tLoss: 0.526564\n", - "Train Epoch: 2 [8320/12183 (68%)]\tLoss: 0.453763\n", - "Train Epoch: 2 [8960/12183 (73%)]\tLoss: 0.463578\n", - "Train Epoch: 2 [9600/12183 (79%)]\tLoss: 0.505179\n", - "Train Epoch: 2 [10240/12183 (84%)]\tLoss: 0.390394\n", - "Train Epoch: 2 [10880/12183 (89%)]\tLoss: 0.431393\n", - "Train Epoch: 2 [11520/12183 (94%)]\tLoss: 0.422808\n", - "Train Epoch: 2 [4370/12183 (99%)]\tLoss: 0.379329\n", - "\n", - "Test set: Average loss: 3.8944\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 954.0/958(100%)\n", - "Class 7 accuracy: 1005.0/1028(98%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12183 (0%)]\tLoss: 0.411217\n", - "Train Epoch: 3 [640/12183 (5%)]\tLoss: 0.430715\n", - "Train Epoch: 3 [1280/12183 (10%)]\tLoss: 0.321807\n", - "Train Epoch: 3 [1920/12183 (16%)]\tLoss: 0.305609\n", - "Train Epoch: 3 [2560/12183 (21%)]\tLoss: 0.329529\n", - "Train Epoch: 3 
[3200/12183 (26%)]\tLoss: 0.344710\n", - "Train Epoch: 3 [3840/12183 (31%)]\tLoss: 0.351153\n", - "Train Epoch: 3 [4480/12183 (37%)]\tLoss: 0.355009\n", - "Train Epoch: 3 [5120/12183 (42%)]\tLoss: 0.316889\n", - "Train Epoch: 3 [5760/12183 (47%)]\tLoss: 0.268590\n", - "Train Epoch: 3 [6400/12183 (52%)]\tLoss: 0.269210\n", - "Train Epoch: 3 [7040/12183 (58%)]\tLoss: 0.272690\n", - "Train Epoch: 3 [7680/12183 (63%)]\tLoss: 0.299527\n", - "Train Epoch: 3 [8320/12183 (68%)]\tLoss: 0.294239\n", - "Train Epoch: 3 [8960/12183 (73%)]\tLoss: 0.256061\n", - "Train Epoch: 3 [9600/12183 (79%)]\tLoss: 0.263354\n", - "Train Epoch: 3 [10240/12183 (84%)]\tLoss: 0.266107\n", - "Train Epoch: 3 [10880/12183 (89%)]\tLoss: 0.301182\n", - "Train Epoch: 3 [11520/12183 (94%)]\tLoss: 0.221701\n", - "Train Epoch: 3 [4370/12183 (99%)]\tLoss: 0.256709\n", - "\n", - "Test set: Average loss: 4.6037\n", + "Train Epoch: 1 [0/12183 (0%)]\tLoss: 12.640953\n", + "Train Epoch: 1 [640/12183 (5%)]\tLoss: 6.948784\n", + "Train Epoch: 1 [1280/12183 (10%)]\tLoss: 2.239110\n", + "Train Epoch: 1 [1920/12183 (16%)]\tLoss: 0.789898\n", + "Train Epoch: 1 [2560/12183 (21%)]\tLoss: 0.433876\n", + "Train Epoch: 1 [3200/12183 (26%)]\tLoss: 0.327010\n", + "Train Epoch: 1 [3840/12183 (31%)]\tLoss: 0.240610\n", + "Train Epoch: 1 [4480/12183 (37%)]\tLoss: 0.189328\n", + "Train Epoch: 1 [5120/12183 (42%)]\tLoss: 0.189419\n", + "Train Epoch: 1 [5760/12183 (47%)]\tLoss: 0.063147\n", + "Train Epoch: 1 [6400/12183 (52%)]\tLoss: 0.061185\n", + "Train Epoch: 1 [7040/12183 (58%)]\tLoss: 0.115183\n", + "Train Epoch: 1 [7680/12183 (63%)]\tLoss: 0.030512\n", + "Train Epoch: 1 [8320/12183 (68%)]\tLoss: 0.037145\n", + "Train Epoch: 1 [8960/12183 (73%)]\tLoss: 0.089052\n", + "Train Epoch: 1 [9600/12183 (79%)]\tLoss: 0.044766\n", + "Train Epoch: 1 [10240/12183 (84%)]\tLoss: 0.027388\n", + "Train Epoch: 1 [10880/12183 (89%)]\tLoss: 0.041345\n", + "Train Epoch: 1 [11520/12183 (94%)]\tLoss: 0.022225\n", + "Train Epoch: 1 [4370/12183 
(99%)]\tLoss: 0.004926\n", + "\n", + "Test set: Average loss: 7.6796\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 954.0/958(100%)\n", - "Class 7 accuracy: 1012.0/1028(98%)\n", + "Class 6 accuracy: 955.0/958(100%)\n", + "Class 7 accuracy: 1017.0/1028(99%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12183 (0%)]\tLoss: 0.200790\n", - "Train Epoch: 4 [640/12183 (5%)]\tLoss: 0.200424\n", - "Train Epoch: 4 [1280/12183 (10%)]\tLoss: 0.190599\n", - "Train Epoch: 4 [1920/12183 (16%)]\tLoss: 0.205490\n", - "Train Epoch: 4 [2560/12183 (21%)]\tLoss: 0.245161\n", - "Train Epoch: 4 [3200/12183 (26%)]\tLoss: 0.154059\n", - "Train Epoch: 4 [3840/12183 (31%)]\tLoss: 0.181401\n", - "Train Epoch: 4 [4480/12183 (37%)]\tLoss: 0.283187\n", - "Train Epoch: 4 [5120/12183 (42%)]\tLoss: 0.176126\n", - "Train Epoch: 4 [5760/12183 (47%)]\tLoss: 0.218665\n", - "Train Epoch: 4 [6400/12183 (52%)]\tLoss: 0.294239\n", - "Train Epoch: 4 [7040/12183 (58%)]\tLoss: 0.213903\n", - "Train Epoch: 4 [7680/12183 (63%)]\tLoss: 0.233052\n", - "Train Epoch: 4 [8320/12183 (68%)]\tLoss: 0.161038\n", - "Train Epoch: 4 [8960/12183 (73%)]\tLoss: 0.211654\n", - "Train Epoch: 4 [9600/12183 (79%)]\tLoss: 0.192449\n", - "Train Epoch: 4 [10240/12183 (84%)]\tLoss: 0.161328\n", - "Train Epoch: 4 [10880/12183 (89%)]\tLoss: 0.197734\n", - "Train Epoch: 4 [11520/12183 (94%)]\tLoss: 0.191102\n", - "Train Epoch: 4 [4370/12183 (99%)]\tLoss: 0.376056\n", - "\n", - "Test set: Average loss: 4.9524\n", + "Train Epoch: 2 [0/12183 (0%)]\tLoss: 0.056296\n", + "Train Epoch: 2 [640/12183 (5%)]\tLoss: 0.026770\n", + "Train Epoch: 2 [1280/12183 (10%)]\tLoss: 0.014056\n", + "Train Epoch: 2 [1920/12183 (16%)]\tLoss: 0.026122\n", + "Train Epoch: 2 [2560/12183 (21%)]\tLoss: 0.025161\n", + "Train 
Epoch: 2 [3200/12183 (26%)]\tLoss: 0.033366\n", + "Train Epoch: 2 [3840/12183 (31%)]\tLoss: 0.011129\n", + "Train Epoch: 2 [4480/12183 (37%)]\tLoss: 0.034492\n", + "Train Epoch: 2 [5120/12183 (42%)]\tLoss: 0.009984\n", + "Train Epoch: 2 [5760/12183 (47%)]\tLoss: 0.035312\n", + "Train Epoch: 2 [6400/12183 (52%)]\tLoss: 0.028434\n", + "Train Epoch: 2 [7040/12183 (58%)]\tLoss: 0.012921\n", + "Train Epoch: 2 [7680/12183 (63%)]\tLoss: 0.009203\n", + "Train Epoch: 2 [8320/12183 (68%)]\tLoss: 0.034064\n", + "Train Epoch: 2 [8960/12183 (73%)]\tLoss: 0.018005\n", + "Train Epoch: 2 [9600/12183 (79%)]\tLoss: 0.007107\n", + "Train Epoch: 2 [10240/12183 (84%)]\tLoss: 0.003789\n", + "Train Epoch: 2 [10880/12183 (89%)]\tLoss: 0.056796\n", + "Train Epoch: 2 [11520/12183 (94%)]\tLoss: 0.008388\n", + "Train Epoch: 2 [4370/12183 (99%)]\tLoss: 0.008049\n", + "\n", + "Test set: Average loss: 8.7098\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", @@ -1698,31 +844,31 @@ "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 955.0/958(100%)\n", - "Class 7 accuracy: 1013.0/1028(99%)\n", + "Class 7 accuracy: 1021.0/1028(99%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12183 (0%)]\tLoss: 0.250694\n", - "Train Epoch: 5 [640/12183 (5%)]\tLoss: 0.137549\n", - "Train Epoch: 5 [1280/12183 (10%)]\tLoss: 0.179946\n", - "Train Epoch: 5 [1920/12183 (16%)]\tLoss: 0.172115\n", - "Train Epoch: 5 [2560/12183 (21%)]\tLoss: 0.216046\n", - "Train Epoch: 5 [3200/12183 (26%)]\tLoss: 0.137594\n", - "Train Epoch: 5 [3840/12183 (31%)]\tLoss: 0.167268\n", - "Train Epoch: 5 [4480/12183 (37%)]\tLoss: 0.215348\n", - "Train Epoch: 5 [5120/12183 (42%)]\tLoss: 0.190677\n", - "Train Epoch: 5 [5760/12183 (47%)]\tLoss: 0.143424\n", - "Train Epoch: 5 [6400/12183 (52%)]\tLoss: 0.176460\n", - "Train Epoch: 5 [7040/12183 (58%)]\tLoss: 0.115466\n", - "Train Epoch: 5 [7680/12183 
(63%)]\tLoss: 0.123880\n", - "Train Epoch: 5 [8320/12183 (68%)]\tLoss: 0.172899\n", - "Train Epoch: 5 [8960/12183 (73%)]\tLoss: 0.121368\n", - "Train Epoch: 5 [9600/12183 (79%)]\tLoss: 0.117190\n", - "Train Epoch: 5 [10240/12183 (84%)]\tLoss: 0.193983\n", - "Train Epoch: 5 [10880/12183 (89%)]\tLoss: 0.137996\n", - "Train Epoch: 5 [11520/12183 (94%)]\tLoss: 0.165303\n", - "Train Epoch: 5 [4370/12183 (99%)]\tLoss: 0.120738\n", - "\n", - "Test set: Average loss: 5.1628\n", + "Train Epoch: 3 [0/12183 (0%)]\tLoss: 0.031829\n", + "Train Epoch: 3 [640/12183 (5%)]\tLoss: 0.026151\n", + "Train Epoch: 3 [1280/12183 (10%)]\tLoss: 0.013025\n", + "Train Epoch: 3 [1920/12183 (16%)]\tLoss: 0.015742\n", + "Train Epoch: 3 [2560/12183 (21%)]\tLoss: 0.036039\n", + "Train Epoch: 3 [3200/12183 (26%)]\tLoss: 0.019850\n", + "Train Epoch: 3 [3840/12183 (31%)]\tLoss: 0.021591\n", + "Train Epoch: 3 [4480/12183 (37%)]\tLoss: 0.011566\n", + "Train Epoch: 3 [5120/12183 (42%)]\tLoss: 0.012161\n", + "Train Epoch: 3 [5760/12183 (47%)]\tLoss: 0.005265\n", + "Train Epoch: 3 [6400/12183 (52%)]\tLoss: 0.005189\n", + "Train Epoch: 3 [7040/12183 (58%)]\tLoss: 0.023125\n", + "Train Epoch: 3 [7680/12183 (63%)]\tLoss: 0.058819\n", + "Train Epoch: 3 [8320/12183 (68%)]\tLoss: 0.027194\n", + "Train Epoch: 3 [8960/12183 (73%)]\tLoss: 0.010728\n", + "Train Epoch: 3 [9600/12183 (79%)]\tLoss: 0.002767\n", + "Train Epoch: 3 [10240/12183 (84%)]\tLoss: 0.006029\n", + "Train Epoch: 3 [10880/12183 (89%)]\tLoss: 0.090709\n", + "Train Epoch: 3 [11520/12183 (94%)]\tLoss: 0.003533\n", + "Train Epoch: 3 [4370/12183 (99%)]\tLoss: 0.005167\n", + "\n", + "Test set: Average loss: 9.1796\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", @@ -1730,61 +876,30 @@ "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 955.0/958(100%)\n", - "Class 7 accuracy: 1014.0/1028(99%)\n", + "Class 7 accuracy: 1021.0/1028(99%)\n", "Class 8 accuracy: 
0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/11800 (0%)]\tLoss: 8.108945\n", - "Train Epoch: 1 [640/11800 (5%)]\tLoss: 7.738531\n", - "Train Epoch: 1 [1280/11800 (11%)]\tLoss: 6.640255\n", - "Train Epoch: 1 [1920/11800 (16%)]\tLoss: 6.513710\n", - "Train Epoch: 1 [2560/11800 (22%)]\tLoss: 5.460023\n", - "Train Epoch: 1 [3200/11800 (27%)]\tLoss: 5.351851\n", - "Train Epoch: 1 [3840/11800 (32%)]\tLoss: 4.810606\n", - "Train Epoch: 1 [4480/11800 (38%)]\tLoss: 4.409184\n", - "Train Epoch: 1 [5120/11800 (43%)]\tLoss: 3.466255\n", - "Train Epoch: 1 [5760/11800 (49%)]\tLoss: 3.398129\n", - "Train Epoch: 1 [6400/11800 (54%)]\tLoss: 2.812559\n", - "Train Epoch: 1 [7040/11800 (59%)]\tLoss: 2.539098\n", - "Train Epoch: 1 [7680/11800 (65%)]\tLoss: 1.932615\n", - "Train Epoch: 1 [8320/11800 (70%)]\tLoss: 1.948097\n", - "Train Epoch: 1 [8960/11800 (76%)]\tLoss: 1.529168\n", - "Train Epoch: 1 [9600/11800 (81%)]\tLoss: 1.568914\n", - "Train Epoch: 1 [10240/11800 (86%)]\tLoss: 1.332329\n", - "Train Epoch: 1 [10880/11800 (92%)]\tLoss: 1.441239\n", - "Train Epoch: 1 [11520/11800 (97%)]\tLoss: 1.161227\n", - "\n", - "Test set: Average loss: 2.4228\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 485.0/958(51%)\n", - "Class 7 accuracy: 345.0/1028(34%)\n", - "Class 8 accuracy: 962.0/974(99%)\n", - "Class 9 accuracy: 735.0/1009(73%)\n", - "Train Epoch: 2 [0/11800 (0%)]\tLoss: 1.033281\n", - "Train Epoch: 2 [640/11800 (5%)]\tLoss: 1.074798\n", - "Train Epoch: 2 [1280/11800 (11%)]\tLoss: 1.087005\n", - "Train Epoch: 2 [1920/11800 (16%)]\tLoss: 1.221566\n", - "Train Epoch: 2 [2560/11800 (22%)]\tLoss: 1.020146\n", - "Train Epoch: 2 [3200/11800 (27%)]\tLoss: 1.010463\n", - "Train Epoch: 2 [3840/11800 (32%)]\tLoss: 0.871487\n", - "Train Epoch: 2 [4480/11800 
(38%)]\tLoss: 0.892453\n", - "Train Epoch: 2 [5120/11800 (43%)]\tLoss: 0.761051\n", - "Train Epoch: 2 [5760/11800 (49%)]\tLoss: 0.883746\n", - "Train Epoch: 2 [6400/11800 (54%)]\tLoss: 0.881131\n", - "Train Epoch: 2 [7040/11800 (59%)]\tLoss: 0.761468\n", - "Train Epoch: 2 [7680/11800 (65%)]\tLoss: 0.702959\n", - "Train Epoch: 2 [8320/11800 (70%)]\tLoss: 0.575911\n", - "Train Epoch: 2 [8960/11800 (76%)]\tLoss: 0.668820\n", - "Train Epoch: 2 [9600/11800 (81%)]\tLoss: 0.780607\n", - "Train Epoch: 2 [10240/11800 (86%)]\tLoss: 0.565945\n", - "Train Epoch: 2 [10880/11800 (92%)]\tLoss: 0.687550\n", - "Train Epoch: 2 [11520/11800 (97%)]\tLoss: 0.551138\n", - "\n", - "Test set: Average loss: 3.3994\n", + "Train Epoch: 1 [0/11800 (0%)]\tLoss: 14.120369\n", + "Train Epoch: 1 [640/11800 (5%)]\tLoss: 7.705572\n", + "Train Epoch: 1 [1280/11800 (11%)]\tLoss: 2.772657\n", + "Train Epoch: 1 [1920/11800 (16%)]\tLoss: 1.523421\n", + "Train Epoch: 1 [2560/11800 (22%)]\tLoss: 0.632249\n", + "Train Epoch: 1 [3200/11800 (27%)]\tLoss: 0.823988\n", + "Train Epoch: 1 [3840/11800 (32%)]\tLoss: 0.649929\n", + "Train Epoch: 1 [4480/11800 (38%)]\tLoss: 0.382820\n", + "Train Epoch: 1 [5120/11800 (43%)]\tLoss: 0.287871\n", + "Train Epoch: 1 [5760/11800 (49%)]\tLoss: 0.270225\n", + "Train Epoch: 1 [6400/11800 (54%)]\tLoss: 0.250052\n", + "Train Epoch: 1 [7040/11800 (59%)]\tLoss: 0.436681\n", + "Train Epoch: 1 [7680/11800 (65%)]\tLoss: 0.205961\n", + "Train Epoch: 1 [8320/11800 (70%)]\tLoss: 0.226867\n", + "Train Epoch: 1 [8960/11800 (76%)]\tLoss: 0.178260\n", + "Train Epoch: 1 [9600/11800 (81%)]\tLoss: 0.159317\n", + "Train Epoch: 1 [10240/11800 (86%)]\tLoss: 0.402756\n", + "Train Epoch: 1 [10880/11800 (92%)]\tLoss: 0.158059\n", + "Train Epoch: 1 [11520/11800 (97%)]\tLoss: 0.195788\n", + "\n", + "Test set: Average loss: 5.9943\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", @@ -1793,60 +908,29 @@ "Class 5 accuracy: 0.0/892(0%)\n", 
"Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 940.0/974(97%)\n", - "Class 9 accuracy: 914.0/1009(91%)\n", - "Train Epoch: 3 [0/11800 (0%)]\tLoss: 0.637666\n", - "Train Epoch: 3 [640/11800 (5%)]\tLoss: 0.512363\n", - "Train Epoch: 3 [1280/11800 (11%)]\tLoss: 0.587236\n", - "Train Epoch: 3 [1920/11800 (16%)]\tLoss: 0.496453\n", - "Train Epoch: 3 [2560/11800 (22%)]\tLoss: 0.617932\n", - "Train Epoch: 3 [3200/11800 (27%)]\tLoss: 0.538651\n", - "Train Epoch: 3 [3840/11800 (32%)]\tLoss: 0.471803\n", - "Train Epoch: 3 [4480/11800 (38%)]\tLoss: 0.569236\n", - "Train Epoch: 3 [5120/11800 (43%)]\tLoss: 0.473018\n", - "Train Epoch: 3 [5760/11800 (49%)]\tLoss: 0.661038\n", - "Train Epoch: 3 [6400/11800 (54%)]\tLoss: 0.436601\n", - "Train Epoch: 3 [7040/11800 (59%)]\tLoss: 0.551020\n", - "Train Epoch: 3 [7680/11800 (65%)]\tLoss: 0.422065\n", - "Train Epoch: 3 [8320/11800 (70%)]\tLoss: 0.436460\n", - "Train Epoch: 3 [8960/11800 (76%)]\tLoss: 0.521548\n", - "Train Epoch: 3 [9600/11800 (81%)]\tLoss: 0.582636\n", - "Train Epoch: 3 [10240/11800 (86%)]\tLoss: 0.460395\n", - "Train Epoch: 3 [10880/11800 (92%)]\tLoss: 0.637835\n", - "Train Epoch: 3 [11520/11800 (97%)]\tLoss: 0.514315\n", - "\n", - "Test set: Average loss: 3.9214\n", - "Class 0 accuracy: 0.0/980(0%)\n", - "Class 1 accuracy: 0.0/1135(0%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 934.0/974(96%)\n", - "Class 9 accuracy: 939.0/1009(93%)\n", - "Train Epoch: 4 [0/11800 (0%)]\tLoss: 0.498162\n", - "Train Epoch: 4 [640/11800 (5%)]\tLoss: 0.536717\n", - "Train Epoch: 4 [1280/11800 (11%)]\tLoss: 0.436568\n", - "Train Epoch: 4 [1920/11800 (16%)]\tLoss: 0.471787\n", - "Train Epoch: 4 [2560/11800 (22%)]\tLoss: 0.497887\n", - "Train Epoch: 4 [3200/11800 (27%)]\tLoss: 0.444460\n", - 
"Train Epoch: 4 [3840/11800 (32%)]\tLoss: 0.448744\n", - "Train Epoch: 4 [4480/11800 (38%)]\tLoss: 0.372841\n", - "Train Epoch: 4 [5120/11800 (43%)]\tLoss: 0.465649\n", - "Train Epoch: 4 [5760/11800 (49%)]\tLoss: 0.490277\n", - "Train Epoch: 4 [6400/11800 (54%)]\tLoss: 0.463720\n", - "Train Epoch: 4 [7040/11800 (59%)]\tLoss: 0.355945\n", - "Train Epoch: 4 [7680/11800 (65%)]\tLoss: 0.438429\n", - "Train Epoch: 4 [8320/11800 (70%)]\tLoss: 0.508788\n", - "Train Epoch: 4 [8960/11800 (76%)]\tLoss: 0.413552\n", - "Train Epoch: 4 [9600/11800 (81%)]\tLoss: 0.395993\n", - "Train Epoch: 4 [10240/11800 (86%)]\tLoss: 0.410553\n", - "Train Epoch: 4 [10880/11800 (92%)]\tLoss: 0.409377\n", - "Train Epoch: 4 [11520/11800 (97%)]\tLoss: 0.400534\n", - "\n", - "Test set: Average loss: 4.2109\n", + "Class 8 accuracy: 943.0/974(97%)\n", + "Class 9 accuracy: 974.0/1009(97%)\n", + "Train Epoch: 2 [0/11800 (0%)]\tLoss: 0.157916\n", + "Train Epoch: 2 [640/11800 (5%)]\tLoss: 0.187881\n", + "Train Epoch: 2 [1280/11800 (11%)]\tLoss: 0.283773\n", + "Train Epoch: 2 [1920/11800 (16%)]\tLoss: 0.135888\n", + "Train Epoch: 2 [2560/11800 (22%)]\tLoss: 0.211785\n", + "Train Epoch: 2 [3200/11800 (27%)]\tLoss: 0.238753\n", + "Train Epoch: 2 [3840/11800 (32%)]\tLoss: 0.121974\n", + "Train Epoch: 2 [4480/11800 (38%)]\tLoss: 0.074522\n", + "Train Epoch: 2 [5120/11800 (43%)]\tLoss: 0.239114\n", + "Train Epoch: 2 [5760/11800 (49%)]\tLoss: 0.129581\n", + "Train Epoch: 2 [6400/11800 (54%)]\tLoss: 0.055795\n", + "Train Epoch: 2 [7040/11800 (59%)]\tLoss: 0.349395\n", + "Train Epoch: 2 [7680/11800 (65%)]\tLoss: 0.076350\n", + "Train Epoch: 2 [8320/11800 (70%)]\tLoss: 0.072271\n", + "Train Epoch: 2 [8960/11800 (76%)]\tLoss: 0.103121\n", + "Train Epoch: 2 [9600/11800 (81%)]\tLoss: 0.343085\n", + "Train Epoch: 2 [10240/11800 (86%)]\tLoss: 0.095953\n", + "Train Epoch: 2 [10880/11800 (92%)]\tLoss: 0.095618\n", + "Train Epoch: 2 [11520/11800 (97%)]\tLoss: 0.114838\n", + "\n", + "Test set: Average loss: 6.6632\n", 
"Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", @@ -1855,29 +939,29 @@ "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 930.0/974(95%)\n", - "Class 9 accuracy: 948.0/1009(94%)\n", - "Train Epoch: 5 [0/11800 (0%)]\tLoss: 0.441779\n", - "Train Epoch: 5 [640/11800 (5%)]\tLoss: 0.349478\n", - "Train Epoch: 5 [1280/11800 (11%)]\tLoss: 0.347695\n", - "Train Epoch: 5 [1920/11800 (16%)]\tLoss: 0.374920\n", - "Train Epoch: 5 [2560/11800 (22%)]\tLoss: 0.371782\n", - "Train Epoch: 5 [3200/11800 (27%)]\tLoss: 0.405380\n", - "Train Epoch: 5 [3840/11800 (32%)]\tLoss: 0.493990\n", - "Train Epoch: 5 [4480/11800 (38%)]\tLoss: 0.383761\n", - "Train Epoch: 5 [5120/11800 (43%)]\tLoss: 0.361125\n", - "Train Epoch: 5 [5760/11800 (49%)]\tLoss: 0.377500\n", - "Train Epoch: 5 [6400/11800 (54%)]\tLoss: 0.411204\n", - "Train Epoch: 5 [7040/11800 (59%)]\tLoss: 0.467779\n", - "Train Epoch: 5 [7680/11800 (65%)]\tLoss: 0.445416\n", - "Train Epoch: 5 [8320/11800 (70%)]\tLoss: 0.303449\n", - "Train Epoch: 5 [8960/11800 (76%)]\tLoss: 0.319432\n", - "Train Epoch: 5 [9600/11800 (81%)]\tLoss: 0.331827\n", - "Train Epoch: 5 [10240/11800 (86%)]\tLoss: 0.377502\n", - "Train Epoch: 5 [10880/11800 (92%)]\tLoss: 0.406466\n", - "Train Epoch: 5 [11520/11800 (97%)]\tLoss: 0.405720\n", - "\n", - "Test set: Average loss: 4.3858\n", + "Class 8 accuracy: 967.0/974(99%)\n", + "Class 9 accuracy: 965.0/1009(96%)\n", + "Train Epoch: 3 [0/11800 (0%)]\tLoss: 0.126834\n", + "Train Epoch: 3 [640/11800 (5%)]\tLoss: 0.187850\n", + "Train Epoch: 3 [1280/11800 (11%)]\tLoss: 0.102141\n", + "Train Epoch: 3 [1920/11800 (16%)]\tLoss: 0.036415\n", + "Train Epoch: 3 [2560/11800 (22%)]\tLoss: 0.165435\n", + "Train Epoch: 3 [3200/11800 (27%)]\tLoss: 0.109672\n", + "Train Epoch: 3 [3840/11800 (32%)]\tLoss: 0.070627\n", + "Train Epoch: 3 [4480/11800 (38%)]\tLoss: 0.047646\n", + "Train Epoch: 3 
[5120/11800 (43%)]\tLoss: 0.051905\n", + "Train Epoch: 3 [5760/11800 (49%)]\tLoss: 0.264070\n", + "Train Epoch: 3 [6400/11800 (54%)]\tLoss: 0.211393\n", + "Train Epoch: 3 [7040/11800 (59%)]\tLoss: 0.062177\n", + "Train Epoch: 3 [7680/11800 (65%)]\tLoss: 0.033032\n", + "Train Epoch: 3 [8320/11800 (70%)]\tLoss: 0.068230\n", + "Train Epoch: 3 [8960/11800 (76%)]\tLoss: 0.071904\n", + "Train Epoch: 3 [9600/11800 (81%)]\tLoss: 0.102863\n", + "Train Epoch: 3 [10240/11800 (86%)]\tLoss: 0.046137\n", + "Train Epoch: 3 [10880/11800 (92%)]\tLoss: 0.120950\n", + "Train Epoch: 3 [11520/11800 (97%)]\tLoss: 0.101907\n", + "\n", + "Test set: Average loss: 6.9242\n", "Class 0 accuracy: 0.0/980(0%)\n", "Class 1 accuracy: 0.0/1135(0%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", @@ -1886,95 +970,31 @@ "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 929.0/974(95%)\n", - "Class 9 accuracy: 950.0/1009(94%)\n", - "Train Epoch: 1 [0/12665 (0%)]\tLoss: 5.571240\n", - "Train Epoch: 1 [640/12665 (5%)]\tLoss: 5.058652\n", - "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 4.223537\n", - "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 3.769430\n", - "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 3.397155\n", - "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 3.066763\n", - "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 2.407099\n", - "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 2.510794\n", - "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 1.850332\n", - "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 1.656529\n", - "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 1.517869\n", - "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 1.028974\n", - "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.833506\n", - "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.765792\n", - "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.600499\n", - "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.491542\n", - "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.525203\n", - "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.473181\n", - 
"Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.445249\n", - "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.329707\n", - "\n", - "Test set: Average loss: 2.6586\n", - "Class 0 accuracy: 974.0/980(99%)\n", - "Class 1 accuracy: 1134.0/1135(100%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 616.0/1009(61%)\n", - "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.174450\n", - "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.286020\n", - "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.380822\n", - "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.200067\n", - "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.233174\n", - "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.215359\n", - "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.261502\n", - "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.193090\n", - "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.201911\n", - "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.123239\n", - "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.151434\n", - "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.161058\n", - "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.121602\n", - "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.152282\n", - "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.138010\n", - "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.116535\n", - "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.148996\n", - "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.094655\n", - "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.093630\n", - "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.100545\n", - "\n", - "Test set: Average loss: 3.7860\n", - "Class 0 accuracy: 974.0/980(99%)\n", - "Class 1 accuracy: 1134.0/1135(100%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", 
- "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.113853\n", - "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.061060\n", - "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.073625\n", - "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.089106\n", - "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.100265\n", - "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.086965\n", - "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.078005\n", - "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.089567\n", - "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.083796\n", - "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.091500\n", - "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.071154\n", - "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.063725\n", - "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.081232\n", - "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.063744\n", - "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.044772\n", - "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.056600\n", - "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.075639\n", - "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.059448\n", - "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.051801\n", - "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.045583\n", - "\n", - "Test set: Average loss: 4.3795\n", - "Class 0 accuracy: 974.0/980(99%)\n", + "Class 8 accuracy: 952.0/974(98%)\n", + "Class 9 accuracy: 978.0/1009(97%)\n", + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 8.722752\n", + "Train Epoch: 1 [640/12665 (5%)]\tLoss: 3.160372\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 0.653003\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 0.256268\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 0.064630\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 0.089074\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 0.022682\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 0.014132\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 0.011369\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 0.032196\n", + "Train Epoch: 1 
[6400/12665 (51%)]\tLoss: 0.087249\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 0.010759\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.009488\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.009431\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.017381\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.014684\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.007916\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.008834\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.082196\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.002452\n", + "\n", + "Test set: Average loss: 7.1540\n", + "Class 0 accuracy: 977.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -1984,29 +1004,29 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.073423\n", - "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.081250\n", - "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.107188\n", - "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.108589\n", - "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.074006\n", - "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.038409\n", - "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.065204\n", - "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.083654\n", - "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.073944\n", - "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.048630\n", - "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.041222\n", - "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.055742\n", - "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.048848\n", - "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.099426\n", - "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.050589\n", - "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.039493\n", - "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.059188\n", - "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.071380\n", - "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.095400\n", - "Train Epoch: 4 [12160/12665 
(96%)]\tLoss: 0.052493\n", - "\n", - "Test set: Average loss: 4.6909\n", - "Class 0 accuracy: 975.0/980(99%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.000673\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.029478\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.002406\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.008619\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.001777\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.031666\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.133443\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.006141\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.006000\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.003495\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.000851\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.001280\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.000972\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.001776\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.067486\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.001030\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.001892\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.001493\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.047196\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.004952\n", + "\n", + "Test set: Average loss: 7.8296\n", + "Class 0 accuracy: 977.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -2016,29 +1036,29 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.042433\n", - "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.045415\n", - "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.045671\n", - "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.116742\n", - "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.042136\n", - "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.053295\n", - "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.035618\n", - "Train Epoch: 5 
[4480/12665 (35%)]\tLoss: 0.055716\n", - "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.043886\n", - "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.052791\n", - "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.079626\n", - "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.044485\n", - "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.027041\n", - "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.041513\n", - "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.034053\n", - "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.028694\n", - "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.054827\n", - "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.182031\n", - "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.068930\n", - "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.022576\n", - "\n", - "Test set: Average loss: 4.8702\n", - "Class 0 accuracy: 976.0/980(100%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.007902\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.003385\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.001230\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.001810\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.001579\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.028920\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.004439\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.001913\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.000407\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.004402\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.009100\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.000980\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.000387\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.004606\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.001144\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.007978\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.011006\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.001300\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.000758\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.001379\n", + "\n", + "Test set: Average loss: 8.1397\n", + 
"Class 0 accuracy: 978.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -2049,6 +1069,213 @@ "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n" ] + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "[{0: 0.996938775510204,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1'},\n", + " {0: 0.996938775510204,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1'},\n", + " {0: 0.996938775510204,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.9612403100775194,\n", + " 3: 0.9772277227722772,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '2_3'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.9670542635658915,\n", + " 3: 0.9841584158415841,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '2_3'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.9757751937984496,\n", + " 3: 0.9752475247524752,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '2_3'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.994908350305499,\n", + " 5: 0.9708520179372198,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '4_5'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.9959266802443992,\n", + " 5: 0.9775784753363229,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 
0.0,\n", + " 9: 0.0,\n", + " 'phase': '4_5'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.9959266802443992,\n", + " 5: 0.9854260089686099,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '4_5'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.9968684759916493,\n", + " 7: 0.9892996108949417,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '6_7'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.9968684759916493,\n", + " 7: 0.9931906614785992,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '6_7'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.9968684759916493,\n", + " 7: 0.9931906614785992,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '6_7'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.9681724845995893,\n", + " 9: 0.9653121902874133,\n", + " 'phase': '8_9'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.9928131416837782,\n", + " 9: 0.956392467789891,\n", + " 'phase': '8_9'},\n", + " {0: 0.0,\n", + " 1: 0.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.9774127310061602,\n", + " 9: 0.9692765113974232,\n", + " 'phase': '8_9'},\n", + " {0: 0.996938775510204,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1_again'},\n", + " {0: 0.996938775510204,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': 
'0_1_again'},\n", + " {0: 0.9979591836734694,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1_again'}]" + ] + }, + "metadata": {}, + "execution_count": 19 } ] }, @@ -2100,41 +1327,41 @@ "history_memory_replay" ], "metadata": { + "id": "LtWvHl_tQCpg", "colab": { "base_uri": "https://localhost:8080/" }, - "id": "LtWvHl_tQCpg", - "outputId": "e4913ffb-5f2b-474f-d24a-bde139af833c" + "outputId": "6705c5fe-9838-4da5-a562-77d7c9a8c6d8" }, - "execution_count": 16, + "execution_count": 20, "outputs": [ { "output_type": "stream", "name": "stdout", "text": [ - "Train Epoch: 1 [0/12665 (0%)]\tLoss: 2.295792\n", - "Train Epoch: 1 [640/12665 (5%)]\tLoss: 2.208695\n", - "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 2.106677\n", - "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 1.961109\n", - "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 1.898052\n", - "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 1.824553\n", - "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 1.719246\n", - "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 1.623634\n", - "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 1.617715\n", - "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 1.727536\n", - "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 1.507114\n", - "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 1.447730\n", - "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 1.549878\n", - "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 1.058249\n", - "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 1.447155\n", - "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 1.273197\n", - "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 1.260120\n", - "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 1.187015\n", - "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 1.091164\n", - "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.971557\n", - "\n", - "Test set: Average loss: 2.7060\n", - "Class 0 accuracy: 972.0/980(99%)\n", + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 2.196357\n", + "Train Epoch: 1 [640/12665 
(5%)]\tLoss: 1.335955\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 0.555878\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 0.146986\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 0.082966\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 0.054255\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 0.011100\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 0.078007\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 0.005687\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 0.004260\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 0.002415\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 0.005845\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.005518\n", + "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.001475\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.002208\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.000701\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.000352\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.000833\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.002580\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.002562\n", + "\n", + "Test set: Average loss: 7.8370\n", + "Class 0 accuracy: 976.0/980(100%)\n", "Class 1 accuracy: 1134.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -2144,93 +1371,29 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.952087\n", - "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.869477\n", - "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.858798\n", - "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.809786\n", - "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.799570\n", - "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.890806\n", - "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.805940\n", - "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 1.059435\n", - "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.478667\n", - "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.673640\n", - "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 
0.538314\n", - "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.710136\n", - "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.516661\n", - "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.602048\n", - "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.384920\n", - "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.435023\n", - "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.372631\n", - "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.426314\n", - "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.539168\n", - "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.321303\n", - "\n", - "Test set: Average loss: 3.8263\n", - "Class 0 accuracy: 966.0/980(99%)\n", - "Class 1 accuracy: 1135.0/1135(100%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.401120\n", - "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.263190\n", - "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.398854\n", - "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.229336\n", - "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.240626\n", - "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.239559\n", - "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.418891\n", - "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.177813\n", - "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.226682\n", - "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.215379\n", - "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.211677\n", - "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.224589\n", - "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.253302\n", - "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.212234\n", - "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.230823\n", - "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.164656\n", - "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.154504\n", - "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.100245\n", - "Train Epoch: 3 
[11520/12665 (91%)]\tLoss: 0.156521\n", - "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.232217\n", - "\n", - "Test set: Average loss: 4.6647\n", - "Class 0 accuracy: 963.0/980(98%)\n", - "Class 1 accuracy: 1135.0/1135(100%)\n", - "Class 2 accuracy: 0.0/1032(0%)\n", - "Class 3 accuracy: 0.0/1010(0%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.131072\n", - "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.227836\n", - "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.161914\n", - "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.182439\n", - "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.123449\n", - "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.118936\n", - "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.132258\n", - "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.191232\n", - "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.192155\n", - "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.122639\n", - "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.138319\n", - "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.106367\n", - "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.078942\n", - "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.103141\n", - "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.129387\n", - "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.117389\n", - "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.164451\n", - "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.216510\n", - "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 0.110041\n", - "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.104683\n", - "\n", - "Test set: Average loss: 5.1577\n", - "Class 0 accuracy: 966.0/980(99%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.221930\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.027592\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.065451\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.015034\n", + "Train Epoch: 2 
[2560/12665 (20%)]\tLoss: 0.046994\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.008316\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.021686\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.024137\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.002627\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.042552\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.026033\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.002244\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.003471\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.041315\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.008438\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.000700\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.000417\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.002115\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.008961\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.002133\n", + "\n", + "Test set: Average loss: 8.7829\n", + "Class 0 accuracy: 976.0/980(100%)\n", "Class 1 accuracy: 1135.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -2240,29 +1403,29 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.077715\n", - "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.105138\n", - "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.124953\n", - "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.080610\n", - "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.123617\n", - "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.112670\n", - "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.093631\n", - "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.122231\n", - "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.093652\n", - "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.167812\n", - "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.117981\n", - "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.066692\n", - "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.080171\n", - "Train Epoch: 5 [8320/12665 
(66%)]\tLoss: 0.092669\n", - "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.146656\n", - "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.101289\n", - "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.089997\n", - "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.108752\n", - "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.078000\n", - "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.046221\n", - "\n", - "Test set: Average loss: 5.4729\n", - "Class 0 accuracy: 968.0/980(99%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.000570\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.011992\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.000725\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.000835\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.000185\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.001194\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.000802\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.001044\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.001886\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.001518\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.001240\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.005406\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.004714\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.000870\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.001174\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.000833\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.006711\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.006384\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.006488\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.000901\n", + "\n", + "Test set: Average loss: 9.2011\n", + "Class 0 accuracy: 977.0/980(100%)\n", "Class 1 accuracy: 1135.0/1135(100%)\n", "Class 2 accuracy: 0.0/1032(0%)\n", "Class 3 accuracy: 0.0/1010(0%)\n", @@ -2272,61 +1435,30 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/12089 (0%)]\tLoss: 1.166433\n", - "Train Epoch: 1 
[640/12089 (5%)]\tLoss: 1.153999\n", - "Train Epoch: 1 [1280/12089 (11%)]\tLoss: 1.238186\n", - "Train Epoch: 1 [1920/12089 (16%)]\tLoss: 1.274190\n", - "Train Epoch: 1 [2560/12089 (21%)]\tLoss: 1.001455\n", - "Train Epoch: 1 [3200/12089 (26%)]\tLoss: 0.980768\n", - "Train Epoch: 1 [3840/12089 (32%)]\tLoss: 0.890982\n", - "Train Epoch: 1 [4480/12089 (37%)]\tLoss: 0.845770\n", - "Train Epoch: 1 [5120/12089 (42%)]\tLoss: 0.915158\n", - "Train Epoch: 1 [5760/12089 (48%)]\tLoss: 0.577478\n", - "Train Epoch: 1 [6400/12089 (53%)]\tLoss: 0.558826\n", - "Train Epoch: 1 [7040/12089 (58%)]\tLoss: 0.697927\n", - "Train Epoch: 1 [7680/12089 (63%)]\tLoss: 0.780273\n", - "Train Epoch: 1 [8320/12089 (69%)]\tLoss: 0.586348\n", - "Train Epoch: 1 [8960/12089 (74%)]\tLoss: 0.634719\n", - "Train Epoch: 1 [9600/12089 (79%)]\tLoss: 0.753965\n", - "Train Epoch: 1 [10240/12089 (85%)]\tLoss: 0.886030\n", - "Train Epoch: 1 [10880/12089 (90%)]\tLoss: 0.913329\n", - "Train Epoch: 1 [11520/12089 (95%)]\tLoss: 0.726805\n", - "\n", - "Test set: Average loss: 2.9830\n", - "Class 0 accuracy: 966.0/980(99%)\n", - "Class 1 accuracy: 1132.0/1135(100%)\n", - "Class 2 accuracy: 109.0/1032(11%)\n", - "Class 3 accuracy: 668.0/1010(66%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/12089 (0%)]\tLoss: 0.903527\n", - "Train Epoch: 2 [640/12089 (5%)]\tLoss: 0.690564\n", - "Train Epoch: 2 [1280/12089 (11%)]\tLoss: 1.054734\n", - "Train Epoch: 2 [1920/12089 (16%)]\tLoss: 0.668291\n", - "Train Epoch: 2 [2560/12089 (21%)]\tLoss: 0.846006\n", - "Train Epoch: 2 [3200/12089 (26%)]\tLoss: 0.862174\n", - "Train Epoch: 2 [3840/12089 (32%)]\tLoss: 1.078590\n", - "Train Epoch: 2 [4480/12089 (37%)]\tLoss: 0.812564\n", - "Train Epoch: 2 [5120/12089 (42%)]\tLoss: 0.751745\n", - "Train Epoch: 2 [5760/12089 (48%)]\tLoss: 
0.819927\n", - "Train Epoch: 2 [6400/12089 (53%)]\tLoss: 0.641764\n", - "Train Epoch: 2 [7040/12089 (58%)]\tLoss: 0.941192\n", - "Train Epoch: 2 [7680/12089 (63%)]\tLoss: 1.113382\n", - "Train Epoch: 2 [8320/12089 (69%)]\tLoss: 0.745287\n", - "Train Epoch: 2 [8960/12089 (74%)]\tLoss: 0.845461\n", - "Train Epoch: 2 [9600/12089 (79%)]\tLoss: 0.675010\n", - "Train Epoch: 2 [10240/12089 (85%)]\tLoss: 0.772856\n", - "Train Epoch: 2 [10880/12089 (90%)]\tLoss: 0.668837\n", - "Train Epoch: 2 [11520/12089 (95%)]\tLoss: 0.776711\n", - "\n", - "Test set: Average loss: 3.1608\n", - "Class 0 accuracy: 828.0/980(84%)\n", - "Class 1 accuracy: 1091.0/1135(96%)\n", - "Class 2 accuracy: 898.0/1032(87%)\n", + "Train Epoch: 1 [0/12089 (0%)]\tLoss: 2.805099\n", + "Train Epoch: 1 [640/12089 (5%)]\tLoss: 1.660801\n", + "Train Epoch: 1 [1280/12089 (11%)]\tLoss: 0.437137\n", + "Train Epoch: 1 [1920/12089 (16%)]\tLoss: 0.808282\n", + "Train Epoch: 1 [2560/12089 (21%)]\tLoss: 0.285198\n", + "Train Epoch: 1 [3200/12089 (26%)]\tLoss: 0.129722\n", + "Train Epoch: 1 [3840/12089 (32%)]\tLoss: 0.145888\n", + "Train Epoch: 1 [4480/12089 (37%)]\tLoss: 0.343596\n", + "Train Epoch: 1 [5120/12089 (42%)]\tLoss: 0.078071\n", + "Train Epoch: 1 [5760/12089 (48%)]\tLoss: 0.098522\n", + "Train Epoch: 1 [6400/12089 (53%)]\tLoss: 0.089895\n", + "Train Epoch: 1 [7040/12089 (58%)]\tLoss: 0.067733\n", + "Train Epoch: 1 [7680/12089 (63%)]\tLoss: 0.046314\n", + "Train Epoch: 1 [8320/12089 (69%)]\tLoss: 0.028943\n", + "Train Epoch: 1 [8960/12089 (74%)]\tLoss: 0.082591\n", + "Train Epoch: 1 [9600/12089 (79%)]\tLoss: 0.024760\n", + "Train Epoch: 1 [10240/12089 (85%)]\tLoss: 0.050374\n", + "Train Epoch: 1 [10880/12089 (90%)]\tLoss: 0.020318\n", + "Train Epoch: 1 [11520/12089 (95%)]\tLoss: 0.025210\n", + "\n", + "Test set: Average loss: 5.2845\n", + "Class 0 accuracy: 829.0/980(85%)\n", + "Class 1 accuracy: 1046.0/1135(92%)\n", + "Class 2 accuracy: 991.0/1032(96%)\n", "Class 3 accuracy: 983.0/1010(97%)\n", "Class 4 
accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", @@ -2334,725 +1466,651 @@ "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12089 (0%)]\tLoss: 0.733399\n", - "Train Epoch: 3 [640/12089 (5%)]\tLoss: 0.793913\n", - "Train Epoch: 3 [1280/12089 (11%)]\tLoss: 0.580512\n", - "Train Epoch: 3 [1920/12089 (16%)]\tLoss: 0.477269\n", - "Train Epoch: 3 [2560/12089 (21%)]\tLoss: 0.833255\n", - "Train Epoch: 3 [3200/12089 (26%)]\tLoss: 0.636208\n", - "Train Epoch: 3 [3840/12089 (32%)]\tLoss: 0.573351\n", - "Train Epoch: 3 [4480/12089 (37%)]\tLoss: 0.656650\n", - "Train Epoch: 3 [5120/12089 (42%)]\tLoss: 0.692221\n", - "Train Epoch: 3 [5760/12089 (48%)]\tLoss: 0.723047\n", - "Train Epoch: 3 [6400/12089 (53%)]\tLoss: 0.626788\n", - "Train Epoch: 3 [7040/12089 (58%)]\tLoss: 0.557750\n", - "Train Epoch: 3 [7680/12089 (63%)]\tLoss: 0.643362\n", - "Train Epoch: 3 [8320/12089 (69%)]\tLoss: 0.725737\n", - "Train Epoch: 3 [8960/12089 (74%)]\tLoss: 0.868968\n", - "Train Epoch: 3 [9600/12089 (79%)]\tLoss: 0.720436\n", - "Train Epoch: 3 [10240/12089 (85%)]\tLoss: 0.723306\n", - "Train Epoch: 3 [10880/12089 (90%)]\tLoss: 0.624521\n", - "Train Epoch: 3 [11520/12089 (95%)]\tLoss: 0.507009\n", - "\n", - "Test set: Average loss: 3.3136\n", - "Class 0 accuracy: 780.0/980(80%)\n", - "Class 1 accuracy: 1067.0/1135(94%)\n", - "Class 2 accuracy: 917.0/1032(89%)\n", - "Class 3 accuracy: 983.0/1010(97%)\n", + "Train Epoch: 2 [0/12089 (0%)]\tLoss: 0.091748\n", + "Train Epoch: 2 [640/12089 (5%)]\tLoss: 0.038480\n", + "Train Epoch: 2 [1280/12089 (11%)]\tLoss: 0.027258\n", + "Train Epoch: 2 [1920/12089 (16%)]\tLoss: 0.040072\n", + "Train Epoch: 2 [2560/12089 (21%)]\tLoss: 0.024616\n", + "Train Epoch: 2 [3200/12089 (26%)]\tLoss: 0.021542\n", + "Train Epoch: 2 [3840/12089 (32%)]\tLoss: 0.016757\n", + "Train Epoch: 2 [4480/12089 (37%)]\tLoss: 0.029563\n", + "Train Epoch: 2 [5120/12089 (42%)]\tLoss: 0.010378\n", + "Train 
Epoch: 2 [5760/12089 (48%)]\tLoss: 0.020319\n", + "Train Epoch: 2 [6400/12089 (53%)]\tLoss: 0.019660\n", + "Train Epoch: 2 [7040/12089 (58%)]\tLoss: 0.006761\n", + "Train Epoch: 2 [7680/12089 (63%)]\tLoss: 0.026263\n", + "Train Epoch: 2 [8320/12089 (69%)]\tLoss: 0.008666\n", + "Train Epoch: 2 [8960/12089 (74%)]\tLoss: 0.013218\n", + "Train Epoch: 2 [9600/12089 (79%)]\tLoss: 0.002491\n", + "Train Epoch: 2 [10240/12089 (85%)]\tLoss: 0.010161\n", + "Train Epoch: 2 [10880/12089 (90%)]\tLoss: 0.019670\n", + "Train Epoch: 2 [11520/12089 (95%)]\tLoss: 0.012468\n", + "\n", + "Test set: Average loss: 6.1435\n", + "Class 0 accuracy: 764.0/980(78%)\n", + "Class 1 accuracy: 999.0/1135(88%)\n", + "Class 2 accuracy: 1000.0/1032(97%)\n", + "Class 3 accuracy: 988.0/1010(98%)\n", "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12089 (0%)]\tLoss: 0.624655\n", - "Train Epoch: 4 [640/12089 (5%)]\tLoss: 0.452378\n", - "Train Epoch: 4 [1280/12089 (11%)]\tLoss: 0.457449\n", - "Train Epoch: 4 [1920/12089 (16%)]\tLoss: 0.554645\n", - "Train Epoch: 4 [2560/12089 (21%)]\tLoss: 0.621985\n", - "Train Epoch: 4 [3200/12089 (26%)]\tLoss: 0.527864\n", - "Train Epoch: 4 [3840/12089 (32%)]\tLoss: 0.577068\n", - "Train Epoch: 4 [4480/12089 (37%)]\tLoss: 0.514906\n", - "Train Epoch: 4 [5120/12089 (42%)]\tLoss: 0.581334\n", - "Train Epoch: 4 [5760/12089 (48%)]\tLoss: 0.331880\n", - "Train Epoch: 4 [6400/12089 (53%)]\tLoss: 0.424212\n", - "Train Epoch: 4 [7040/12089 (58%)]\tLoss: 0.527507\n", - "Train Epoch: 4 [7680/12089 (63%)]\tLoss: 0.685347\n", - "Train Epoch: 4 [8320/12089 (69%)]\tLoss: 0.525770\n", - "Train Epoch: 4 [8960/12089 (74%)]\tLoss: 0.417910\n", - "Train Epoch: 4 [9600/12089 (79%)]\tLoss: 0.731371\n", - "Train Epoch: 4 [10240/12089 (85%)]\tLoss: 0.528346\n", - "Train Epoch: 4 [10880/12089 (90%)]\tLoss: 
0.454048\n", - "Train Epoch: 4 [11520/12089 (95%)]\tLoss: 0.373003\n", - "\n", - "Test set: Average loss: 3.4222\n", - "Class 0 accuracy: 754.0/980(77%)\n", - "Class 1 accuracy: 1055.0/1135(93%)\n", - "Class 2 accuracy: 918.0/1032(89%)\n", - "Class 3 accuracy: 986.0/1010(98%)\n", + "Train Epoch: 3 [0/12089 (0%)]\tLoss: 0.028908\n", + "Train Epoch: 3 [640/12089 (5%)]\tLoss: 0.017523\n", + "Train Epoch: 3 [1280/12089 (11%)]\tLoss: 0.012286\n", + "Train Epoch: 3 [1920/12089 (16%)]\tLoss: 0.029993\n", + "Train Epoch: 3 [2560/12089 (21%)]\tLoss: 0.014532\n", + "Train Epoch: 3 [3200/12089 (26%)]\tLoss: 0.023068\n", + "Train Epoch: 3 [3840/12089 (32%)]\tLoss: 0.007645\n", + "Train Epoch: 3 [4480/12089 (37%)]\tLoss: 0.016837\n", + "Train Epoch: 3 [5120/12089 (42%)]\tLoss: 0.004771\n", + "Train Epoch: 3 [5760/12089 (48%)]\tLoss: 0.004505\n", + "Train Epoch: 3 [6400/12089 (53%)]\tLoss: 0.085267\n", + "Train Epoch: 3 [7040/12089 (58%)]\tLoss: 0.007249\n", + "Train Epoch: 3 [7680/12089 (63%)]\tLoss: 0.005857\n", + "Train Epoch: 3 [8320/12089 (69%)]\tLoss: 0.036750\n", + "Train Epoch: 3 [8960/12089 (74%)]\tLoss: 0.035684\n", + "Train Epoch: 3 [9600/12089 (79%)]\tLoss: 0.005433\n", + "Train Epoch: 3 [10240/12089 (85%)]\tLoss: 0.006491\n", + "Train Epoch: 3 [10880/12089 (90%)]\tLoss: 0.026140\n", + "Train Epoch: 3 [11520/12089 (95%)]\tLoss: 0.007269\n", + "\n", + "Test set: Average loss: 6.5537\n", + "Class 0 accuracy: 723.0/980(74%)\n", + "Class 1 accuracy: 968.0/1135(85%)\n", + "Class 2 accuracy: 999.0/1032(97%)\n", + "Class 3 accuracy: 992.0/1010(98%)\n", "Class 4 accuracy: 0.0/982(0%)\n", "Class 5 accuracy: 0.0/892(0%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12089 (0%)]\tLoss: 0.546961\n", - "Train Epoch: 5 [640/12089 (5%)]\tLoss: 0.382696\n", - "Train Epoch: 5 [1280/12089 (11%)]\tLoss: 0.616167\n", - "Train Epoch: 5 [1920/12089 (16%)]\tLoss: 
0.551108\n", - "Train Epoch: 5 [2560/12089 (21%)]\tLoss: 0.671682\n", - "Train Epoch: 5 [3200/12089 (26%)]\tLoss: 0.434367\n", - "Train Epoch: 5 [3840/12089 (32%)]\tLoss: 0.589797\n", - "Train Epoch: 5 [4480/12089 (37%)]\tLoss: 0.462255\n", - "Train Epoch: 5 [5120/12089 (42%)]\tLoss: 0.427646\n", - "Train Epoch: 5 [5760/12089 (48%)]\tLoss: 0.393138\n", - "Train Epoch: 5 [6400/12089 (53%)]\tLoss: 0.374952\n", - "Train Epoch: 5 [7040/12089 (58%)]\tLoss: 0.392871\n", - "Train Epoch: 5 [7680/12089 (63%)]\tLoss: 0.494981\n", - "Train Epoch: 5 [8320/12089 (69%)]\tLoss: 0.474602\n", - "Train Epoch: 5 [8960/12089 (74%)]\tLoss: 0.418477\n", - "Train Epoch: 5 [9600/12089 (79%)]\tLoss: 0.402891\n", - "Train Epoch: 5 [10240/12089 (85%)]\tLoss: 0.545055\n", - "Train Epoch: 5 [10880/12089 (90%)]\tLoss: 0.465828\n", - "Train Epoch: 5 [11520/12089 (95%)]\tLoss: 0.378968\n", - "\n", - "Test set: Average loss: 3.4964\n", - "Class 0 accuracy: 743.0/980(76%)\n", - "Class 1 accuracy: 1053.0/1135(93%)\n", - "Class 2 accuracy: 928.0/1032(90%)\n", - "Class 3 accuracy: 986.0/1010(98%)\n", - "Class 4 accuracy: 0.0/982(0%)\n", - "Class 5 accuracy: 0.0/892(0%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/11263 (0%)]\tLoss: 0.850781\n", - "Train Epoch: 1 [640/11263 (6%)]\tLoss: 0.798292\n", - "Train Epoch: 1 [1280/11263 (11%)]\tLoss: 0.834117\n", - "Train Epoch: 1 [1920/11263 (17%)]\tLoss: 0.725765\n", - "Train Epoch: 1 [2560/11263 (23%)]\tLoss: 0.676635\n", - "Train Epoch: 1 [3200/11263 (28%)]\tLoss: 0.758110\n", - "Train Epoch: 1 [3840/11263 (34%)]\tLoss: 0.689677\n", - "Train Epoch: 1 [4480/11263 (40%)]\tLoss: 0.686142\n", - "Train Epoch: 1 [5120/11263 (45%)]\tLoss: 0.819930\n", - "Train Epoch: 1 [5760/11263 (51%)]\tLoss: 0.822826\n", - "Train Epoch: 1 [6400/11263 (57%)]\tLoss: 0.597154\n", - "Train Epoch: 1 [7040/11263 (62%)]\tLoss: 0.712456\n", - "Train Epoch: 
1 [7680/11263 (68%)]\tLoss: 0.668146\n", - "Train Epoch: 1 [8320/11263 (74%)]\tLoss: 0.641806\n", - "Train Epoch: 1 [8960/11263 (80%)]\tLoss: 0.607866\n", - "Train Epoch: 1 [9600/11263 (85%)]\tLoss: 0.837627\n", - "Train Epoch: 1 [10240/11263 (91%)]\tLoss: 0.767775\n", - "Train Epoch: 1 [10880/11263 (97%)]\tLoss: 0.710244\n", - "\n", - "Test set: Average loss: 2.3788\n", - "Class 0 accuracy: 936.0/980(96%)\n", - "Class 1 accuracy: 1123.0/1135(99%)\n", - "Class 2 accuracy: 808.0/1032(78%)\n", - "Class 3 accuracy: 926.0/1010(92%)\n", - "Class 4 accuracy: 790.0/982(80%)\n", - "Class 5 accuracy: 360.0/892(40%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/11263 (0%)]\tLoss: 0.896705\n", - "Train Epoch: 2 [640/11263 (6%)]\tLoss: 0.905773\n", - "Train Epoch: 2 [1280/11263 (11%)]\tLoss: 0.899539\n", - "Train Epoch: 2 [1920/11263 (17%)]\tLoss: 0.838611\n", - "Train Epoch: 2 [2560/11263 (23%)]\tLoss: 0.892302\n", - "Train Epoch: 2 [3200/11263 (28%)]\tLoss: 1.038975\n", - "Train Epoch: 2 [3840/11263 (34%)]\tLoss: 0.937163\n", - "Train Epoch: 2 [4480/11263 (40%)]\tLoss: 0.748620\n", - "Train Epoch: 2 [5120/11263 (45%)]\tLoss: 0.863919\n", - "Train Epoch: 2 [5760/11263 (51%)]\tLoss: 1.029196\n", - "Train Epoch: 2 [6400/11263 (57%)]\tLoss: 0.845210\n", - "Train Epoch: 2 [7040/11263 (62%)]\tLoss: 0.758227\n", - "Train Epoch: 2 [7680/11263 (68%)]\tLoss: 0.620243\n", - "Train Epoch: 2 [8320/11263 (74%)]\tLoss: 0.842112\n", - "Train Epoch: 2 [8960/11263 (80%)]\tLoss: 0.743856\n", - "Train Epoch: 2 [9600/11263 (85%)]\tLoss: 0.656504\n", - "Train Epoch: 2 [10240/11263 (91%)]\tLoss: 0.817470\n", - "Train Epoch: 2 [10880/11263 (97%)]\tLoss: 0.658012\n", - "\n", - "Test set: Average loss: 2.4907\n", - "Class 0 accuracy: 789.0/980(81%)\n", - "Class 1 accuracy: 1107.0/1135(98%)\n", - "Class 2 accuracy: 670.0/1032(65%)\n", - "Class 3 accuracy: 515.0/1010(51%)\n", 
- "Class 4 accuracy: 942.0/982(96%)\n", - "Class 5 accuracy: 766.0/892(86%)\n", - "Class 6 accuracy: 0.0/958(0%)\n", - "Class 7 accuracy: 0.0/1028(0%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/11263 (0%)]\tLoss: 0.754302\n", - "Train Epoch: 3 [640/11263 (6%)]\tLoss: 0.660190\n", - "Train Epoch: 3 [1280/11263 (11%)]\tLoss: 0.655176\n", - "Train Epoch: 3 [1920/11263 (17%)]\tLoss: 0.696439\n", - "Train Epoch: 3 [2560/11263 (23%)]\tLoss: 0.786622\n", - "Train Epoch: 3 [3200/11263 (28%)]\tLoss: 0.699489\n", - "Train Epoch: 3 [3840/11263 (34%)]\tLoss: 0.776751\n", - "Train Epoch: 3 [4480/11263 (40%)]\tLoss: 0.755700\n", - "Train Epoch: 3 [5120/11263 (45%)]\tLoss: 0.776476\n", - "Train Epoch: 3 [5760/11263 (51%)]\tLoss: 0.718861\n", - "Train Epoch: 3 [6400/11263 (57%)]\tLoss: 0.644046\n", - "Train Epoch: 3 [7040/11263 (62%)]\tLoss: 0.879339\n", - "Train Epoch: 3 [7680/11263 (68%)]\tLoss: 0.587297\n", - "Train Epoch: 3 [8320/11263 (74%)]\tLoss: 0.763207\n", - "Train Epoch: 3 [8960/11263 (80%)]\tLoss: 0.761769\n", - "Train Epoch: 3 [9600/11263 (85%)]\tLoss: 0.656073\n", - "Train Epoch: 3 [10240/11263 (91%)]\tLoss: 0.616851\n", - "Train Epoch: 3 [10880/11263 (97%)]\tLoss: 0.573584\n", - "\n", - "Test set: Average loss: 2.5840\n", - "Class 0 accuracy: 754.0/980(77%)\n", - "Class 1 accuracy: 1089.0/1135(96%)\n", - "Class 2 accuracy: 640.0/1032(62%)\n", - "Class 3 accuracy: 371.0/1010(37%)\n", - "Class 4 accuracy: 960.0/982(98%)\n", - "Class 5 accuracy: 800.0/892(90%)\n", + "Train Epoch: 1 [0/11263 (0%)]\tLoss: 1.635322\n", + "Train Epoch: 1 [640/11263 (6%)]\tLoss: 0.442154\n", + "Train Epoch: 1 [1280/11263 (11%)]\tLoss: 0.249078\n", + "Train Epoch: 1 [1920/11263 (17%)]\tLoss: 0.270407\n", + "Train Epoch: 1 [2560/11263 (23%)]\tLoss: 0.180369\n", + "Train Epoch: 1 [3200/11263 (28%)]\tLoss: 0.088140\n", + "Train Epoch: 1 [3840/11263 (34%)]\tLoss: 0.171120\n", + "Train Epoch: 1 [4480/11263 (40%)]\tLoss: 0.263797\n", + 
"Train Epoch: 1 [5120/11263 (45%)]\tLoss: 0.111911\n", + "Train Epoch: 1 [5760/11263 (51%)]\tLoss: 0.117878\n", + "Train Epoch: 1 [6400/11263 (57%)]\tLoss: 0.033867\n", + "Train Epoch: 1 [7040/11263 (62%)]\tLoss: 0.058040\n", + "Train Epoch: 1 [7680/11263 (68%)]\tLoss: 0.034263\n", + "Train Epoch: 1 [8320/11263 (74%)]\tLoss: 0.082758\n", + "Train Epoch: 1 [8960/11263 (80%)]\tLoss: 0.041592\n", + "Train Epoch: 1 [9600/11263 (85%)]\tLoss: 0.035437\n", + "Train Epoch: 1 [10240/11263 (91%)]\tLoss: 0.015268\n", + "Train Epoch: 1 [10880/11263 (97%)]\tLoss: 0.029453\n", + "\n", + "Test set: Average loss: 4.5940\n", + "Class 0 accuracy: 760.0/980(78%)\n", + "Class 1 accuracy: 986.0/1135(87%)\n", + "Class 2 accuracy: 664.0/1032(64%)\n", + "Class 3 accuracy: 367.0/1010(36%)\n", + "Class 4 accuracy: 979.0/982(100%)\n", + "Class 5 accuracy: 864.0/892(97%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/11263 (0%)]\tLoss: 0.648252\n", - "Train Epoch: 4 [640/11263 (6%)]\tLoss: 0.596721\n", - "Train Epoch: 4 [1280/11263 (11%)]\tLoss: 0.558993\n", - "Train Epoch: 4 [1920/11263 (17%)]\tLoss: 0.492765\n", - "Train Epoch: 4 [2560/11263 (23%)]\tLoss: 0.646996\n", - "Train Epoch: 4 [3200/11263 (28%)]\tLoss: 0.737724\n", - "Train Epoch: 4 [3840/11263 (34%)]\tLoss: 0.578851\n", - "Train Epoch: 4 [4480/11263 (40%)]\tLoss: 0.646620\n", - "Train Epoch: 4 [5120/11263 (45%)]\tLoss: 0.652254\n", - "Train Epoch: 4 [5760/11263 (51%)]\tLoss: 0.631144\n", - "Train Epoch: 4 [6400/11263 (57%)]\tLoss: 0.702145\n", - "Train Epoch: 4 [7040/11263 (62%)]\tLoss: 0.601468\n", - "Train Epoch: 4 [7680/11263 (68%)]\tLoss: 0.567884\n", - "Train Epoch: 4 [8320/11263 (74%)]\tLoss: 0.487138\n", - "Train Epoch: 4 [8960/11263 (80%)]\tLoss: 0.673586\n", - "Train Epoch: 4 [9600/11263 (85%)]\tLoss: 0.492252\n", - "Train Epoch: 4 [10240/11263 (91%)]\tLoss: 0.645415\n", - "Train Epoch: 4 [10880/11263 
(97%)]\tLoss: 0.587828\n", - "\n", - "Test set: Average loss: 2.6582\n", - "Class 0 accuracy: 731.0/980(75%)\n", - "Class 1 accuracy: 1086.0/1135(96%)\n", - "Class 2 accuracy: 631.0/1032(61%)\n", - "Class 3 accuracy: 293.0/1010(29%)\n", - "Class 4 accuracy: 959.0/982(98%)\n", - "Class 5 accuracy: 817.0/892(92%)\n", + "Train Epoch: 2 [0/11263 (0%)]\tLoss: 0.008444\n", + "Train Epoch: 2 [640/11263 (6%)]\tLoss: 0.020623\n", + "Train Epoch: 2 [1280/11263 (11%)]\tLoss: 0.028893\n", + "Train Epoch: 2 [1920/11263 (17%)]\tLoss: 0.025949\n", + "Train Epoch: 2 [2560/11263 (23%)]\tLoss: 0.027629\n", + "Train Epoch: 2 [3200/11263 (28%)]\tLoss: 0.012673\n", + "Train Epoch: 2 [3840/11263 (34%)]\tLoss: 0.132138\n", + "Train Epoch: 2 [4480/11263 (40%)]\tLoss: 0.019918\n", + "Train Epoch: 2 [5120/11263 (45%)]\tLoss: 0.040663\n", + "Train Epoch: 2 [5760/11263 (51%)]\tLoss: 0.072586\n", + "Train Epoch: 2 [6400/11263 (57%)]\tLoss: 0.027573\n", + "Train Epoch: 2 [7040/11263 (62%)]\tLoss: 0.010655\n", + "Train Epoch: 2 [7680/11263 (68%)]\tLoss: 0.007804\n", + "Train Epoch: 2 [8320/11263 (74%)]\tLoss: 0.021280\n", + "Train Epoch: 2 [8960/11263 (80%)]\tLoss: 0.038740\n", + "Train Epoch: 2 [9600/11263 (85%)]\tLoss: 0.005795\n", + "Train Epoch: 2 [10240/11263 (91%)]\tLoss: 0.005783\n", + "Train Epoch: 2 [10880/11263 (97%)]\tLoss: 0.049235\n", + "\n", + "Test set: Average loss: 5.5267\n", + "Class 0 accuracy: 647.0/980(66%)\n", + "Class 1 accuracy: 970.0/1135(85%)\n", + "Class 2 accuracy: 616.0/1032(60%)\n", + "Class 3 accuracy: 240.0/1010(24%)\n", + "Class 4 accuracy: 979.0/982(100%)\n", + "Class 5 accuracy: 876.0/892(98%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/11263 (0%)]\tLoss: 0.693316\n", - "Train Epoch: 5 [640/11263 (6%)]\tLoss: 0.579783\n", - "Train Epoch: 5 [1280/11263 (11%)]\tLoss: 0.606642\n", - "Train Epoch: 5 [1920/11263 (17%)]\tLoss: 0.578930\n", - 
"Train Epoch: 5 [2560/11263 (23%)]\tLoss: 0.593126\n", - "Train Epoch: 5 [3200/11263 (28%)]\tLoss: 0.568712\n", - "Train Epoch: 5 [3840/11263 (34%)]\tLoss: 0.730927\n", - "Train Epoch: 5 [4480/11263 (40%)]\tLoss: 0.517850\n", - "Train Epoch: 5 [5120/11263 (45%)]\tLoss: 0.595436\n", - "Train Epoch: 5 [5760/11263 (51%)]\tLoss: 0.623922\n", - "Train Epoch: 5 [6400/11263 (57%)]\tLoss: 0.477650\n", - "Train Epoch: 5 [7040/11263 (62%)]\tLoss: 0.672610\n", - "Train Epoch: 5 [7680/11263 (68%)]\tLoss: 0.543774\n", - "Train Epoch: 5 [8320/11263 (74%)]\tLoss: 0.580296\n", - "Train Epoch: 5 [8960/11263 (80%)]\tLoss: 0.583141\n", - "Train Epoch: 5 [9600/11263 (85%)]\tLoss: 0.448098\n", - "Train Epoch: 5 [10240/11263 (91%)]\tLoss: 0.625687\n", - "Train Epoch: 5 [10880/11263 (97%)]\tLoss: 0.533021\n", - "\n", - "Test set: Average loss: 2.7075\n", - "Class 0 accuracy: 719.0/980(73%)\n", - "Class 1 accuracy: 1080.0/1135(95%)\n", - "Class 2 accuracy: 629.0/1032(61%)\n", - "Class 3 accuracy: 287.0/1010(28%)\n", - "Class 4 accuracy: 959.0/982(98%)\n", - "Class 5 accuracy: 834.0/892(93%)\n", + "Train Epoch: 3 [0/11263 (0%)]\tLoss: 0.060683\n", + "Train Epoch: 3 [640/11263 (6%)]\tLoss: 0.049512\n", + "Train Epoch: 3 [1280/11263 (11%)]\tLoss: 0.034698\n", + "Train Epoch: 3 [1920/11263 (17%)]\tLoss: 0.015581\n", + "Train Epoch: 3 [2560/11263 (23%)]\tLoss: 0.097252\n", + "Train Epoch: 3 [3200/11263 (28%)]\tLoss: 0.022429\n", + "Train Epoch: 3 [3840/11263 (34%)]\tLoss: 0.021434\n", + "Train Epoch: 3 [4480/11263 (40%)]\tLoss: 0.030935\n", + "Train Epoch: 3 [5120/11263 (45%)]\tLoss: 0.055945\n", + "Train Epoch: 3 [5760/11263 (51%)]\tLoss: 0.032630\n", + "Train Epoch: 3 [6400/11263 (57%)]\tLoss: 0.010632\n", + "Train Epoch: 3 [7040/11263 (62%)]\tLoss: 0.014181\n", + "Train Epoch: 3 [7680/11263 (68%)]\tLoss: 0.011640\n", + "Train Epoch: 3 [8320/11263 (74%)]\tLoss: 0.022853\n", + "Train Epoch: 3 [8960/11263 (80%)]\tLoss: 0.011952\n", + "Train Epoch: 3 [9600/11263 (85%)]\tLoss: 0.029158\n", + 
"Train Epoch: 3 [10240/11263 (91%)]\tLoss: 0.005775\n", + "Train Epoch: 3 [10880/11263 (97%)]\tLoss: 0.044570\n", + "\n", + "Test set: Average loss: 6.0346\n", + "Class 0 accuracy: 662.0/980(68%)\n", + "Class 1 accuracy: 972.0/1135(86%)\n", + "Class 2 accuracy: 558.0/1032(54%)\n", + "Class 3 accuracy: 228.0/1010(23%)\n", + "Class 4 accuracy: 978.0/982(100%)\n", + "Class 5 accuracy: 883.0/892(99%)\n", "Class 6 accuracy: 0.0/958(0%)\n", "Class 7 accuracy: 0.0/1028(0%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/12183 (0%)]\tLoss: 0.851070\n", - "Train Epoch: 1 [640/12183 (5%)]\tLoss: 0.703527\n", - "Train Epoch: 1 [1280/12183 (10%)]\tLoss: 0.862511\n", - "Train Epoch: 1 [1920/12183 (16%)]\tLoss: 0.664779\n", - "Train Epoch: 1 [2560/12183 (21%)]\tLoss: 0.622195\n", - "Train Epoch: 1 [3200/12183 (26%)]\tLoss: 0.686788\n", - "Train Epoch: 1 [3840/12183 (31%)]\tLoss: 0.766821\n", - "Train Epoch: 1 [4480/12183 (37%)]\tLoss: 0.635133\n", - "Train Epoch: 1 [5120/12183 (42%)]\tLoss: 0.673985\n", - "Train Epoch: 1 [5760/12183 (47%)]\tLoss: 0.736285\n", - "Train Epoch: 1 [6400/12183 (52%)]\tLoss: 0.763070\n", - "Train Epoch: 1 [7040/12183 (58%)]\tLoss: 0.914076\n", - "Train Epoch: 1 [7680/12183 (63%)]\tLoss: 0.897798\n", - "Train Epoch: 1 [8320/12183 (68%)]\tLoss: 0.769690\n", - "Train Epoch: 1 [8960/12183 (73%)]\tLoss: 0.705697\n", - "Train Epoch: 1 [9600/12183 (79%)]\tLoss: 0.890666\n", - "Train Epoch: 1 [10240/12183 (84%)]\tLoss: 0.964875\n", - "Train Epoch: 1 [10880/12183 (89%)]\tLoss: 0.846083\n", - "Train Epoch: 1 [11520/12183 (94%)]\tLoss: 0.977361\n", - "Train Epoch: 1 [4370/12183 (99%)]\tLoss: 1.044579\n", - "\n", - "Test set: Average loss: 1.6683\n", - "Class 0 accuracy: 839.0/980(86%)\n", - "Class 1 accuracy: 1086.0/1135(96%)\n", - "Class 2 accuracy: 547.0/1032(53%)\n", - "Class 3 accuracy: 854.0/1010(85%)\n", - "Class 4 accuracy: 673.0/982(69%)\n", - "Class 5 accuracy: 311.0/892(35%)\n", - "Class 6 accuracy: 
878.0/958(92%)\n", - "Class 7 accuracy: 904.0/1028(88%)\n", + "Train Epoch: 1 [0/12183 (0%)]\tLoss: 1.379911\n", + "Train Epoch: 1 [640/12183 (5%)]\tLoss: 0.125989\n", + "Train Epoch: 1 [1280/12183 (10%)]\tLoss: 0.938824\n", + "Train Epoch: 1 [1920/12183 (16%)]\tLoss: 0.376103\n", + "Train Epoch: 1 [2560/12183 (21%)]\tLoss: 0.235958\n", + "Train Epoch: 1 [3200/12183 (26%)]\tLoss: 0.146971\n", + "Train Epoch: 1 [3840/12183 (31%)]\tLoss: 0.261188\n", + "Train Epoch: 1 [4480/12183 (37%)]\tLoss: 0.162076\n", + "Train Epoch: 1 [5120/12183 (42%)]\tLoss: 0.064259\n", + "Train Epoch: 1 [5760/12183 (47%)]\tLoss: 0.127866\n", + "Train Epoch: 1 [6400/12183 (52%)]\tLoss: 0.153409\n", + "Train Epoch: 1 [7040/12183 (58%)]\tLoss: 0.117668\n", + "Train Epoch: 1 [7680/12183 (63%)]\tLoss: 0.058572\n", + "Train Epoch: 1 [8320/12183 (68%)]\tLoss: 0.084697\n", + "Train Epoch: 1 [8960/12183 (73%)]\tLoss: 0.034420\n", + "Train Epoch: 1 [9600/12183 (79%)]\tLoss: 0.017252\n", + "Train Epoch: 1 [10240/12183 (84%)]\tLoss: 0.020837\n", + "Train Epoch: 1 [10880/12183 (89%)]\tLoss: 0.022506\n", + "Train Epoch: 1 [11520/12183 (94%)]\tLoss: 0.073931\n", + "Train Epoch: 1 [4370/12183 (99%)]\tLoss: 0.032285\n", + "\n", + "Test set: Average loss: 2.6226\n", + "Class 0 accuracy: 668.0/980(68%)\n", + "Class 1 accuracy: 975.0/1135(86%)\n", + "Class 2 accuracy: 475.0/1032(46%)\n", + "Class 3 accuracy: 489.0/1010(48%)\n", + "Class 4 accuracy: 691.0/982(70%)\n", + "Class 5 accuracy: 564.0/892(63%)\n", + "Class 6 accuracy: 948.0/958(99%)\n", + "Class 7 accuracy: 1003.0/1028(98%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 2 [0/12183 (0%)]\tLoss: 0.782327\n", - "Train Epoch: 2 [640/12183 (5%)]\tLoss: 0.875331\n", - "Train Epoch: 2 [1280/12183 (10%)]\tLoss: 0.926851\n", - "Train Epoch: 2 [1920/12183 (16%)]\tLoss: 0.874468\n", - "Train Epoch: 2 [2560/12183 (21%)]\tLoss: 0.925109\n", - "Train Epoch: 2 [3200/12183 (26%)]\tLoss: 0.954436\n", - "Train Epoch: 2 
[3840/12183 (31%)]\tLoss: 0.942288\n", - "Train Epoch: 2 [4480/12183 (37%)]\tLoss: 0.940796\n", - "Train Epoch: 2 [5120/12183 (42%)]\tLoss: 0.857594\n", - "Train Epoch: 2 [5760/12183 (47%)]\tLoss: 1.031697\n", - "Train Epoch: 2 [6400/12183 (52%)]\tLoss: 0.929081\n", - "Train Epoch: 2 [7040/12183 (58%)]\tLoss: 0.983720\n", - "Train Epoch: 2 [7680/12183 (63%)]\tLoss: 0.876552\n", - "Train Epoch: 2 [8320/12183 (68%)]\tLoss: 0.934435\n", - "Train Epoch: 2 [8960/12183 (73%)]\tLoss: 1.003677\n", - "Train Epoch: 2 [9600/12183 (79%)]\tLoss: 0.931277\n", - "Train Epoch: 2 [10240/12183 (84%)]\tLoss: 1.008535\n", - "Train Epoch: 2 [10880/12183 (89%)]\tLoss: 0.810847\n", - "Train Epoch: 2 [11520/12183 (94%)]\tLoss: 0.702577\n", - "Train Epoch: 2 [4370/12183 (99%)]\tLoss: 0.964019\n", - "\n", - "Test set: Average loss: 1.6425\n", - "Class 0 accuracy: 804.0/980(82%)\n", - "Class 1 accuracy: 1065.0/1135(94%)\n", - "Class 2 accuracy: 527.0/1032(51%)\n", - "Class 3 accuracy: 774.0/1010(77%)\n", - "Class 4 accuracy: 629.0/982(64%)\n", - "Class 5 accuracy: 347.0/892(39%)\n", - "Class 6 accuracy: 931.0/958(97%)\n", - "Class 7 accuracy: 983.0/1028(96%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 3 [0/12183 (0%)]\tLoss: 0.658189\n", - "Train Epoch: 3 [640/12183 (5%)]\tLoss: 0.624558\n", - "Train Epoch: 3 [1280/12183 (10%)]\tLoss: 0.811082\n", - "Train Epoch: 3 [1920/12183 (16%)]\tLoss: 0.653154\n", - "Train Epoch: 3 [2560/12183 (21%)]\tLoss: 0.784420\n", - "Train Epoch: 3 [3200/12183 (26%)]\tLoss: 0.620821\n", - "Train Epoch: 3 [3840/12183 (31%)]\tLoss: 0.743391\n", - "Train Epoch: 3 [4480/12183 (37%)]\tLoss: 0.694466\n", - "Train Epoch: 3 [5120/12183 (42%)]\tLoss: 0.580736\n", - "Train Epoch: 3 [5760/12183 (47%)]\tLoss: 0.673027\n", - "Train Epoch: 3 [6400/12183 (52%)]\tLoss: 0.545014\n", - "Train Epoch: 3 [7040/12183 (58%)]\tLoss: 0.924152\n", - "Train Epoch: 3 [7680/12183 (63%)]\tLoss: 0.730344\n", - "Train Epoch: 3 [8320/12183 
(68%)]\tLoss: 0.724853\n", - "Train Epoch: 3 [8960/12183 (73%)]\tLoss: 0.699868\n", - "Train Epoch: 3 [9600/12183 (79%)]\tLoss: 0.697215\n", - "Train Epoch: 3 [10240/12183 (84%)]\tLoss: 0.783108\n", - "Train Epoch: 3 [10880/12183 (89%)]\tLoss: 0.672869\n", - "Train Epoch: 3 [11520/12183 (94%)]\tLoss: 0.625879\n", - "Train Epoch: 3 [4370/12183 (99%)]\tLoss: 0.598810\n", - "\n", - "Test set: Average loss: 1.6302\n", - "Class 0 accuracy: 797.0/980(81%)\n", - "Class 1 accuracy: 1062.0/1135(94%)\n", - "Class 2 accuracy: 526.0/1032(51%)\n", - "Class 3 accuracy: 762.0/1010(75%)\n", - "Class 4 accuracy: 657.0/982(67%)\n", - "Class 5 accuracy: 415.0/892(47%)\n", - "Class 6 accuracy: 938.0/958(98%)\n", - "Class 7 accuracy: 992.0/1028(96%)\n", - "Class 8 accuracy: 0.0/974(0%)\n", - "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 4 [0/12183 (0%)]\tLoss: 0.686760\n", - "Train Epoch: 4 [640/12183 (5%)]\tLoss: 0.678613\n", - "Train Epoch: 4 [1280/12183 (10%)]\tLoss: 0.649789\n", - "Train Epoch: 4 [1920/12183 (16%)]\tLoss: 0.512429\n", - "Train Epoch: 4 [2560/12183 (21%)]\tLoss: 0.689496\n", - "Train Epoch: 4 [3200/12183 (26%)]\tLoss: 0.608655\n", - "Train Epoch: 4 [3840/12183 (31%)]\tLoss: 0.553349\n", - "Train Epoch: 4 [4480/12183 (37%)]\tLoss: 0.538118\n", - "Train Epoch: 4 [5120/12183 (42%)]\tLoss: 0.461560\n", - "Train Epoch: 4 [5760/12183 (47%)]\tLoss: 0.588525\n", - "Train Epoch: 4 [6400/12183 (52%)]\tLoss: 0.508286\n", - "Train Epoch: 4 [7040/12183 (58%)]\tLoss: 0.540536\n", - "Train Epoch: 4 [7680/12183 (63%)]\tLoss: 0.479708\n", - "Train Epoch: 4 [8320/12183 (68%)]\tLoss: 0.501095\n", - "Train Epoch: 4 [8960/12183 (73%)]\tLoss: 0.469510\n", - "Train Epoch: 4 [9600/12183 (79%)]\tLoss: 0.497756\n", - "Train Epoch: 4 [10240/12183 (84%)]\tLoss: 0.523196\n", - "Train Epoch: 4 [10880/12183 (89%)]\tLoss: 0.555491\n", - "Train Epoch: 4 [11520/12183 (94%)]\tLoss: 0.515540\n", - "Train Epoch: 4 [4370/12183 (99%)]\tLoss: 0.572875\n", - "\n", - "Test set: Average loss: 
1.6347\n", - "Class 0 accuracy: 788.0/980(80%)\n", - "Class 1 accuracy: 1063.0/1135(94%)\n", - "Class 2 accuracy: 534.0/1032(52%)\n", - "Class 3 accuracy: 769.0/1010(76%)\n", - "Class 4 accuracy: 672.0/982(68%)\n", - "Class 5 accuracy: 440.0/892(49%)\n", - "Class 6 accuracy: 940.0/958(98%)\n", - "Class 7 accuracy: 996.0/1028(97%)\n", + "Train Epoch: 2 [0/12183 (0%)]\tLoss: 0.045590\n", + "Train Epoch: 2 [640/12183 (5%)]\tLoss: 0.091010\n", + "Train Epoch: 2 [1280/12183 (10%)]\tLoss: 0.021004\n", + "Train Epoch: 2 [1920/12183 (16%)]\tLoss: 0.036341\n", + "Train Epoch: 2 [2560/12183 (21%)]\tLoss: 0.021020\n", + "Train Epoch: 2 [3200/12183 (26%)]\tLoss: 0.036480\n", + "Train Epoch: 2 [3840/12183 (31%)]\tLoss: 0.043549\n", + "Train Epoch: 2 [4480/12183 (37%)]\tLoss: 0.029598\n", + "Train Epoch: 2 [5120/12183 (42%)]\tLoss: 0.053440\n", + "Train Epoch: 2 [5760/12183 (47%)]\tLoss: 0.016025\n", + "Train Epoch: 2 [6400/12183 (52%)]\tLoss: 0.022595\n", + "Train Epoch: 2 [7040/12183 (58%)]\tLoss: 0.008219\n", + "Train Epoch: 2 [7680/12183 (63%)]\tLoss: 0.047070\n", + "Train Epoch: 2 [8320/12183 (68%)]\tLoss: 0.021060\n", + "Train Epoch: 2 [8960/12183 (73%)]\tLoss: 0.024627\n", + "Train Epoch: 2 [9600/12183 (79%)]\tLoss: 0.031155\n", + "Train Epoch: 2 [10240/12183 (84%)]\tLoss: 0.045095\n", + "Train Epoch: 2 [10880/12183 (89%)]\tLoss: 0.015965\n", + "Train Epoch: 2 [11520/12183 (94%)]\tLoss: 0.025968\n", + "Train Epoch: 2 [4370/12183 (99%)]\tLoss: 0.043935\n", + "\n", + "Test set: Average loss: 3.1688\n", + "Class 0 accuracy: 682.0/980(70%)\n", + "Class 1 accuracy: 969.0/1135(85%)\n", + "Class 2 accuracy: 480.0/1032(47%)\n", + "Class 3 accuracy: 471.0/1010(47%)\n", + "Class 4 accuracy: 635.0/982(65%)\n", + "Class 5 accuracy: 484.0/892(54%)\n", + "Class 6 accuracy: 950.0/958(99%)\n", + "Class 7 accuracy: 1013.0/1028(99%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 5 [0/12183 (0%)]\tLoss: 0.595143\n", - "Train Epoch: 5 [640/12183 
(5%)]\tLoss: 0.550319\n", - "Train Epoch: 5 [1280/12183 (10%)]\tLoss: 0.548414\n", - "Train Epoch: 5 [1920/12183 (16%)]\tLoss: 0.511655\n", - "Train Epoch: 5 [2560/12183 (21%)]\tLoss: 0.401490\n", - "Train Epoch: 5 [3200/12183 (26%)]\tLoss: 0.400202\n", - "Train Epoch: 5 [3840/12183 (31%)]\tLoss: 0.397857\n", - "Train Epoch: 5 [4480/12183 (37%)]\tLoss: 0.479915\n", - "Train Epoch: 5 [5120/12183 (42%)]\tLoss: 0.408378\n", - "Train Epoch: 5 [5760/12183 (47%)]\tLoss: 0.431881\n", - "Train Epoch: 5 [6400/12183 (52%)]\tLoss: 0.429216\n", - "Train Epoch: 5 [7040/12183 (58%)]\tLoss: 0.347318\n", - "Train Epoch: 5 [7680/12183 (63%)]\tLoss: 0.549904\n", - "Train Epoch: 5 [8320/12183 (68%)]\tLoss: 0.484814\n", - "Train Epoch: 5 [8960/12183 (73%)]\tLoss: 0.430466\n", - "Train Epoch: 5 [9600/12183 (79%)]\tLoss: 0.517198\n", - "Train Epoch: 5 [10240/12183 (84%)]\tLoss: 0.395947\n", - "Train Epoch: 5 [10880/12183 (89%)]\tLoss: 0.551409\n", - "Train Epoch: 5 [11520/12183 (94%)]\tLoss: 0.495534\n", - "Train Epoch: 5 [4370/12183 (99%)]\tLoss: 0.495679\n", - "\n", - "Test set: Average loss: 1.6534\n", - "Class 0 accuracy: 781.0/980(80%)\n", - "Class 1 accuracy: 1059.0/1135(93%)\n", - "Class 2 accuracy: 530.0/1032(51%)\n", - "Class 3 accuracy: 763.0/1010(76%)\n", - "Class 4 accuracy: 672.0/982(68%)\n", - "Class 5 accuracy: 444.0/892(50%)\n", - "Class 6 accuracy: 940.0/958(98%)\n", - "Class 7 accuracy: 1001.0/1028(97%)\n", + "Train Epoch: 3 [0/12183 (0%)]\tLoss: 0.019614\n", + "Train Epoch: 3 [640/12183 (5%)]\tLoss: 0.059921\n", + "Train Epoch: 3 [1280/12183 (10%)]\tLoss: 0.018621\n", + "Train Epoch: 3 [1920/12183 (16%)]\tLoss: 0.011714\n", + "Train Epoch: 3 [2560/12183 (21%)]\tLoss: 0.014679\n", + "Train Epoch: 3 [3200/12183 (26%)]\tLoss: 0.012920\n", + "Train Epoch: 3 [3840/12183 (31%)]\tLoss: 0.022788\n", + "Train Epoch: 3 [4480/12183 (37%)]\tLoss: 0.016748\n", + "Train Epoch: 3 [5120/12183 (42%)]\tLoss: 0.028296\n", + "Train Epoch: 3 [5760/12183 (47%)]\tLoss: 0.021148\n", + "Train 
Epoch: 3 [6400/12183 (52%)]\tLoss: 0.008148\n", + "Train Epoch: 3 [7040/12183 (58%)]\tLoss: 0.011808\n", + "Train Epoch: 3 [7680/12183 (63%)]\tLoss: 0.009274\n", + "Train Epoch: 3 [8320/12183 (68%)]\tLoss: 0.011613\n", + "Train Epoch: 3 [8960/12183 (73%)]\tLoss: 0.013502\n", + "Train Epoch: 3 [9600/12183 (79%)]\tLoss: 0.022795\n", + "Train Epoch: 3 [10240/12183 (84%)]\tLoss: 0.013261\n", + "Train Epoch: 3 [10880/12183 (89%)]\tLoss: 0.026117\n", + "Train Epoch: 3 [11520/12183 (94%)]\tLoss: 0.004542\n", + "Train Epoch: 3 [4370/12183 (99%)]\tLoss: 0.002898\n", + "\n", + "Test set: Average loss: 3.5287\n", + "Class 0 accuracy: 636.0/980(65%)\n", + "Class 1 accuracy: 955.0/1135(84%)\n", + "Class 2 accuracy: 451.0/1032(44%)\n", + "Class 3 accuracy: 432.0/1010(43%)\n", + "Class 4 accuracy: 562.0/982(57%)\n", + "Class 5 accuracy: 458.0/892(51%)\n", + "Class 6 accuracy: 952.0/958(99%)\n", + "Class 7 accuracy: 1018.0/1028(99%)\n", "Class 8 accuracy: 0.0/974(0%)\n", "Class 9 accuracy: 0.0/1009(0%)\n", - "Train Epoch: 1 [0/11800 (0%)]\tLoss: 0.848253\n", - "Train Epoch: 1 [640/11800 (5%)]\tLoss: 0.637744\n", - "Train Epoch: 1 [1280/11800 (11%)]\tLoss: 0.628570\n", - "Train Epoch: 1 [1920/11800 (16%)]\tLoss: 0.461403\n", - "Train Epoch: 1 [2560/11800 (22%)]\tLoss: 0.513085\n", - "Train Epoch: 1 [3200/11800 (27%)]\tLoss: 0.590126\n", - "Train Epoch: 1 [3840/11800 (32%)]\tLoss: 0.472829\n", - "Train Epoch: 1 [4480/11800 (38%)]\tLoss: 0.592700\n", - "Train Epoch: 1 [5120/11800 (43%)]\tLoss: 0.617516\n", - "Train Epoch: 1 [5760/11800 (49%)]\tLoss: 0.555048\n", - "Train Epoch: 1 [6400/11800 (54%)]\tLoss: 0.743809\n", - "Train Epoch: 1 [7040/11800 (59%)]\tLoss: 0.765445\n", - "Train Epoch: 1 [7680/11800 (65%)]\tLoss: 0.768416\n", - "Train Epoch: 1 [8320/11800 (70%)]\tLoss: 0.777279\n", - "Train Epoch: 1 [8960/11800 (76%)]\tLoss: 0.842107\n", - "Train Epoch: 1 [9600/11800 (81%)]\tLoss: 0.796940\n", - "Train Epoch: 1 [10240/11800 (86%)]\tLoss: 0.601572\n", - "Train Epoch: 1 
[10880/11800 (92%)]\tLoss: 0.841399\n", - "Train Epoch: 1 [11520/11800 (97%)]\tLoss: 0.846165\n", - "\n", - "Test set: Average loss: 0.9925\n", - "Class 0 accuracy: 835.0/980(85%)\n", - "Class 1 accuracy: 1050.0/1135(93%)\n", - "Class 2 accuracy: 638.0/1032(62%)\n", - "Class 3 accuracy: 738.0/1010(73%)\n", - "Class 4 accuracy: 548.0/982(56%)\n", - "Class 5 accuracy: 170.0/892(19%)\n", - "Class 6 accuracy: 779.0/958(81%)\n", - "Class 7 accuracy: 776.0/1028(75%)\n", - "Class 8 accuracy: 908.0/974(93%)\n", - "Class 9 accuracy: 801.0/1009(79%)\n", - "Train Epoch: 2 [0/11800 (0%)]\tLoss: 0.883257\n", - "Train Epoch: 2 [640/11800 (5%)]\tLoss: 0.857211\n", - "Train Epoch: 2 [1280/11800 (11%)]\tLoss: 0.841614\n", - "Train Epoch: 2 [1920/11800 (16%)]\tLoss: 0.790240\n", - "Train Epoch: 2 [2560/11800 (22%)]\tLoss: 0.950122\n", - "Train Epoch: 2 [3200/11800 (27%)]\tLoss: 0.835133\n", - "Train Epoch: 2 [3840/11800 (32%)]\tLoss: 0.882796\n", - "Train Epoch: 2 [4480/11800 (38%)]\tLoss: 0.810285\n", - "Train Epoch: 2 [5120/11800 (43%)]\tLoss: 0.799711\n", - "Train Epoch: 2 [5760/11800 (49%)]\tLoss: 0.834429\n", - "Train Epoch: 2 [6400/11800 (54%)]\tLoss: 0.839871\n", - "Train Epoch: 2 [7040/11800 (59%)]\tLoss: 0.947290\n", - "Train Epoch: 2 [7680/11800 (65%)]\tLoss: 0.710232\n", - "Train Epoch: 2 [8320/11800 (70%)]\tLoss: 0.779843\n", - "Train Epoch: 2 [8960/11800 (76%)]\tLoss: 0.733478\n", - "Train Epoch: 2 [9600/11800 (81%)]\tLoss: 0.938040\n", - "Train Epoch: 2 [10240/11800 (86%)]\tLoss: 0.839119\n", - "Train Epoch: 2 [10880/11800 (92%)]\tLoss: 0.696384\n", - "Train Epoch: 2 [11520/11800 (97%)]\tLoss: 0.752226\n", - "\n", - "Test set: Average loss: 0.9674\n", - "Class 0 accuracy: 825.0/980(84%)\n", - "Class 1 accuracy: 1004.0/1135(88%)\n", - "Class 2 accuracy: 599.0/1032(58%)\n", - "Class 3 accuracy: 615.0/1010(61%)\n", - "Class 4 accuracy: 332.0/982(34%)\n", - "Class 5 accuracy: 42.0/892(5%)\n", - "Class 6 accuracy: 762.0/958(80%)\n", - "Class 7 accuracy: 623.0/1028(61%)\n", 
- "Class 8 accuracy: 943.0/974(97%)\n", - "Class 9 accuracy: 923.0/1009(91%)\n", - "Train Epoch: 3 [0/11800 (0%)]\tLoss: 0.708711\n", - "Train Epoch: 3 [640/11800 (5%)]\tLoss: 0.783265\n", - "Train Epoch: 3 [1280/11800 (11%)]\tLoss: 0.810831\n", - "Train Epoch: 3 [1920/11800 (16%)]\tLoss: 0.753713\n", - "Train Epoch: 3 [2560/11800 (22%)]\tLoss: 0.696868\n", - "Train Epoch: 3 [3200/11800 (27%)]\tLoss: 0.572866\n", - "Train Epoch: 3 [3840/11800 (32%)]\tLoss: 0.757275\n", - "Train Epoch: 3 [4480/11800 (38%)]\tLoss: 0.732344\n", - "Train Epoch: 3 [5120/11800 (43%)]\tLoss: 0.671541\n", - "Train Epoch: 3 [5760/11800 (49%)]\tLoss: 0.724425\n", - "Train Epoch: 3 [6400/11800 (54%)]\tLoss: 0.719062\n", - "Train Epoch: 3 [7040/11800 (59%)]\tLoss: 0.712015\n", - "Train Epoch: 3 [7680/11800 (65%)]\tLoss: 0.619695\n", - "Train Epoch: 3 [8320/11800 (70%)]\tLoss: 0.781576\n", - "Train Epoch: 3 [8960/11800 (76%)]\tLoss: 0.707311\n", - "Train Epoch: 3 [9600/11800 (81%)]\tLoss: 0.700315\n", - "Train Epoch: 3 [10240/11800 (86%)]\tLoss: 0.579610\n", - "Train Epoch: 3 [10880/11800 (92%)]\tLoss: 0.836607\n", - "Train Epoch: 3 [11520/11800 (97%)]\tLoss: 0.599106\n", - "\n", - "Test set: Average loss: 0.9365\n", - "Class 0 accuracy: 817.0/980(83%)\n", - "Class 1 accuracy: 996.0/1135(88%)\n", - "Class 2 accuracy: 598.0/1032(58%)\n", - "Class 3 accuracy: 612.0/1010(61%)\n", - "Class 4 accuracy: 291.0/982(30%)\n", - "Class 5 accuracy: 58.0/892(7%)\n", - "Class 6 accuracy: 772.0/958(81%)\n", - "Class 7 accuracy: 574.0/1028(56%)\n", - "Class 8 accuracy: 941.0/974(97%)\n", - "Class 9 accuracy: 948.0/1009(94%)\n", - "Train Epoch: 4 [0/11800 (0%)]\tLoss: 0.764324\n", - "Train Epoch: 4 [640/11800 (5%)]\tLoss: 0.750924\n", - "Train Epoch: 4 [1280/11800 (11%)]\tLoss: 0.597976\n", - "Train Epoch: 4 [1920/11800 (16%)]\tLoss: 0.711546\n", - "Train Epoch: 4 [2560/11800 (22%)]\tLoss: 0.744140\n", - "Train Epoch: 4 [3200/11800 (27%)]\tLoss: 0.756678\n", - "Train Epoch: 4 [3840/11800 (32%)]\tLoss: 
0.566600\n", - "Train Epoch: 4 [4480/11800 (38%)]\tLoss: 0.728696\n", - "Train Epoch: 4 [5120/11800 (43%)]\tLoss: 0.720701\n", - "Train Epoch: 4 [5760/11800 (49%)]\tLoss: 0.566305\n", - "Train Epoch: 4 [6400/11800 (54%)]\tLoss: 0.689037\n", - "Train Epoch: 4 [7040/11800 (59%)]\tLoss: 0.678461\n", - "Train Epoch: 4 [7680/11800 (65%)]\tLoss: 0.550391\n", - "Train Epoch: 4 [8320/11800 (70%)]\tLoss: 0.694139\n", - "Train Epoch: 4 [8960/11800 (76%)]\tLoss: 0.700623\n", - "Train Epoch: 4 [9600/11800 (81%)]\tLoss: 0.623185\n", - "Train Epoch: 4 [10240/11800 (86%)]\tLoss: 0.696449\n", - "Train Epoch: 4 [10880/11800 (92%)]\tLoss: 0.732011\n", - "Train Epoch: 4 [11520/11800 (97%)]\tLoss: 0.734793\n", - "\n", - "Test set: Average loss: 0.9336\n", - "Class 0 accuracy: 809.0/980(83%)\n", - "Class 1 accuracy: 986.0/1135(87%)\n", - "Class 2 accuracy: 593.0/1032(57%)\n", - "Class 3 accuracy: 575.0/1010(57%)\n", - "Class 4 accuracy: 283.0/982(29%)\n", - "Class 5 accuracy: 60.0/892(7%)\n", - "Class 6 accuracy: 772.0/958(81%)\n", - "Class 7 accuracy: 550.0/1028(54%)\n", - "Class 8 accuracy: 943.0/974(97%)\n", - "Class 9 accuracy: 956.0/1009(95%)\n", - "Train Epoch: 5 [0/11800 (0%)]\tLoss: 0.598379\n", - "Train Epoch: 5 [640/11800 (5%)]\tLoss: 0.805639\n", - "Train Epoch: 5 [1280/11800 (11%)]\tLoss: 0.687005\n", - "Train Epoch: 5 [1920/11800 (16%)]\tLoss: 0.553637\n", - "Train Epoch: 5 [2560/11800 (22%)]\tLoss: 0.630970\n", - "Train Epoch: 5 [3200/11800 (27%)]\tLoss: 0.618934\n", - "Train Epoch: 5 [3840/11800 (32%)]\tLoss: 0.695465\n", - "Train Epoch: 5 [4480/11800 (38%)]\tLoss: 0.617699\n", - "Train Epoch: 5 [5120/11800 (43%)]\tLoss: 0.745449\n", - "Train Epoch: 5 [5760/11800 (49%)]\tLoss: 0.529404\n", - "Train Epoch: 5 [6400/11800 (54%)]\tLoss: 0.633640\n", - "Train Epoch: 5 [7040/11800 (59%)]\tLoss: 0.788254\n", - "Train Epoch: 5 [7680/11800 (65%)]\tLoss: 0.565721\n", - "Train Epoch: 5 [8320/11800 (70%)]\tLoss: 0.707190\n", - "Train Epoch: 5 [8960/11800 (76%)]\tLoss: 0.583630\n", - 
"Train Epoch: 5 [9600/11800 (81%)]\tLoss: 0.549434\n", - "Train Epoch: 5 [10240/11800 (86%)]\tLoss: 0.546574\n", - "Train Epoch: 5 [10880/11800 (92%)]\tLoss: 0.536187\n", - "Train Epoch: 5 [11520/11800 (97%)]\tLoss: 0.731755\n", - "\n", - "Test set: Average loss: 0.9307\n", - "Class 0 accuracy: 807.0/980(82%)\n", - "Class 1 accuracy: 977.0/1135(86%)\n", - "Class 2 accuracy: 588.0/1032(57%)\n", - "Class 3 accuracy: 548.0/1010(54%)\n", - "Class 4 accuracy: 283.0/982(29%)\n", - "Class 5 accuracy: 70.0/892(8%)\n", - "Class 6 accuracy: 772.0/958(81%)\n", - "Class 7 accuracy: 546.0/1028(53%)\n", + "Train Epoch: 1 [0/11800 (0%)]\tLoss: 0.473740\n", + "Train Epoch: 1 [640/11800 (5%)]\tLoss: 0.210103\n", + "Train Epoch: 1 [1280/11800 (11%)]\tLoss: 0.418402\n", + "Train Epoch: 1 [1920/11800 (16%)]\tLoss: 0.530582\n", + "Train Epoch: 1 [2560/11800 (22%)]\tLoss: 0.304206\n", + "Train Epoch: 1 [3200/11800 (27%)]\tLoss: 0.122092\n", + "Train Epoch: 1 [3840/11800 (32%)]\tLoss: 0.183575\n", + "Train Epoch: 1 [4480/11800 (38%)]\tLoss: 0.260152\n", + "Train Epoch: 1 [5120/11800 (43%)]\tLoss: 0.277376\n", + "Train Epoch: 1 [5760/11800 (49%)]\tLoss: 0.212683\n", + "Train Epoch: 1 [6400/11800 (54%)]\tLoss: 0.163834\n", + "Train Epoch: 1 [7040/11800 (59%)]\tLoss: 0.088070\n", + "Train Epoch: 1 [7680/11800 (65%)]\tLoss: 0.092493\n", + "Train Epoch: 1 [8320/11800 (70%)]\tLoss: 0.169504\n", + "Train Epoch: 1 [8960/11800 (76%)]\tLoss: 0.130592\n", + "Train Epoch: 1 [9600/11800 (81%)]\tLoss: 0.043165\n", + "Train Epoch: 1 [10240/11800 (86%)]\tLoss: 0.051642\n", + "Train Epoch: 1 [10880/11800 (92%)]\tLoss: 0.081378\n", + "Train Epoch: 1 [11520/11800 (97%)]\tLoss: 0.073074\n", + "\n", + "Test set: Average loss: 1.1909\n", + "Class 0 accuracy: 710.0/980(72%)\n", + "Class 1 accuracy: 937.0/1135(83%)\n", + "Class 2 accuracy: 525.0/1032(51%)\n", + "Class 3 accuracy: 409.0/1010(40%)\n", + "Class 4 accuracy: 368.0/982(37%)\n", + "Class 5 accuracy: 359.0/892(40%)\n", + "Class 6 accuracy: 
782.0/958(82%)\n", + "Class 7 accuracy: 587.0/1028(57%)\n", "Class 8 accuracy: 945.0/974(97%)\n", - "Class 9 accuracy: 958.0/1009(95%)\n", - "Train Epoch: 1 [0/12665 (0%)]\tLoss: 0.606930\n", - "Train Epoch: 1 [640/12665 (5%)]\tLoss: 0.566195\n", - "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 0.488845\n", - "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 0.440726\n", - "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 0.412488\n", - "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 0.525131\n", - "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 0.394614\n", - "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 0.449948\n", - "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 0.455428\n", - "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 0.374721\n", - "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 0.441609\n", - "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 0.499441\n", - "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.482373\n", - "Train Epoch: 1 [8320/12665 (66%)]\tLoss: 0.431031\n", - "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.455554\n", - "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.415438\n", - "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.355638\n", - "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.477118\n", - "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.512437\n", - "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.351764\n", - "\n", - "Test set: Average loss: 0.8019\n", - "Class 0 accuracy: 968.0/980(99%)\n", - "Class 1 accuracy: 1130.0/1135(100%)\n", - "Class 2 accuracy: 604.0/1032(59%)\n", - "Class 3 accuracy: 753.0/1010(75%)\n", - "Class 4 accuracy: 673.0/982(69%)\n", - "Class 5 accuracy: 496.0/892(56%)\n", - "Class 6 accuracy: 695.0/958(73%)\n", - "Class 7 accuracy: 825.0/1028(80%)\n", - "Class 8 accuracy: 589.0/974(60%)\n", - "Class 9 accuracy: 751.0/1009(74%)\n", - "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.382221\n", - "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.359024\n", - "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.443718\n", - "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.352842\n", - "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 
0.390380\n", - "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.450553\n", - "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.285430\n", - "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.317991\n", - "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.304995\n", - "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.402834\n", - "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.410913\n", - "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.323035\n", - "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.359033\n", - "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.332048\n", - "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.344597\n", - "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.363583\n", - "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.267385\n", - "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.303813\n", - "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.394272\n", - "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.275770\n", - "\n", - "Test set: Average loss: 0.7998\n", - "Class 0 accuracy: 970.0/980(99%)\n", - "Class 1 accuracy: 1130.0/1135(100%)\n", - "Class 2 accuracy: 586.0/1032(57%)\n", - "Class 3 accuracy: 743.0/1010(74%)\n", - "Class 4 accuracy: 675.0/982(69%)\n", - "Class 5 accuracy: 498.0/892(56%)\n", - "Class 6 accuracy: 686.0/958(72%)\n", - "Class 7 accuracy: 819.0/1028(80%)\n", - "Class 8 accuracy: 607.0/974(62%)\n", - "Class 9 accuracy: 756.0/1009(75%)\n", - "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.361247\n", - "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.295900\n", - "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.298250\n", - "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.288731\n", - "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.304051\n", - "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.301107\n", - "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.264046\n", - "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.236352\n", - "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.251096\n", - "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.369783\n", - "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.356867\n", - "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 
0.247389\n", - "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.264304\n", - "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.243768\n", - "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.328787\n", - "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.294538\n", - "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.300040\n", - "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.258787\n", - "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.283641\n", - "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.338280\n", - "\n", - "Test set: Average loss: 0.7930\n", - "Class 0 accuracy: 971.0/980(99%)\n", - "Class 1 accuracy: 1130.0/1135(100%)\n", - "Class 2 accuracy: 589.0/1032(57%)\n", - "Class 3 accuracy: 741.0/1010(73%)\n", - "Class 4 accuracy: 671.0/982(68%)\n", - "Class 5 accuracy: 516.0/892(58%)\n", - "Class 6 accuracy: 685.0/958(72%)\n", - "Class 7 accuracy: 813.0/1028(79%)\n", - "Class 8 accuracy: 608.0/974(62%)\n", - "Class 9 accuracy: 755.0/1009(75%)\n", - "Train Epoch: 4 [0/12665 (0%)]\tLoss: 0.236698\n", - "Train Epoch: 4 [640/12665 (5%)]\tLoss: 0.221445\n", - "Train Epoch: 4 [1280/12665 (10%)]\tLoss: 0.236138\n", - "Train Epoch: 4 [1920/12665 (15%)]\tLoss: 0.257844\n", - "Train Epoch: 4 [2560/12665 (20%)]\tLoss: 0.233735\n", - "Train Epoch: 4 [3200/12665 (25%)]\tLoss: 0.222089\n", - "Train Epoch: 4 [3840/12665 (30%)]\tLoss: 0.307528\n", - "Train Epoch: 4 [4480/12665 (35%)]\tLoss: 0.285662\n", - "Train Epoch: 4 [5120/12665 (40%)]\tLoss: 0.240001\n", - "Train Epoch: 4 [5760/12665 (45%)]\tLoss: 0.292137\n", - "Train Epoch: 4 [6400/12665 (51%)]\tLoss: 0.290430\n", - "Train Epoch: 4 [7040/12665 (56%)]\tLoss: 0.299295\n", - "Train Epoch: 4 [7680/12665 (61%)]\tLoss: 0.255210\n", - "Train Epoch: 4 [8320/12665 (66%)]\tLoss: 0.203961\n", - "Train Epoch: 4 [8960/12665 (71%)]\tLoss: 0.238729\n", - "Train Epoch: 4 [9600/12665 (76%)]\tLoss: 0.249784\n", - "Train Epoch: 4 [10240/12665 (81%)]\tLoss: 0.193929\n", - "Train Epoch: 4 [10880/12665 (86%)]\tLoss: 0.198174\n", - "Train Epoch: 4 [11520/12665 (91%)]\tLoss: 
0.270540\n", - "Train Epoch: 4 [12160/12665 (96%)]\tLoss: 0.217733\n", - "\n", - "Test set: Average loss: 0.8017\n", - "Class 0 accuracy: 971.0/980(99%)\n", - "Class 1 accuracy: 1130.0/1135(100%)\n", - "Class 2 accuracy: 575.0/1032(56%)\n", - "Class 3 accuracy: 736.0/1010(73%)\n", - "Class 4 accuracy: 671.0/982(68%)\n", - "Class 5 accuracy: 511.0/892(57%)\n", - "Class 6 accuracy: 682.0/958(71%)\n", - "Class 7 accuracy: 814.0/1028(79%)\n", - "Class 8 accuracy: 607.0/974(62%)\n", - "Class 9 accuracy: 750.0/1009(74%)\n", - "Train Epoch: 5 [0/12665 (0%)]\tLoss: 0.226164\n", - "Train Epoch: 5 [640/12665 (5%)]\tLoss: 0.318618\n", - "Train Epoch: 5 [1280/12665 (10%)]\tLoss: 0.238432\n", - "Train Epoch: 5 [1920/12665 (15%)]\tLoss: 0.262093\n", - "Train Epoch: 5 [2560/12665 (20%)]\tLoss: 0.286501\n", - "Train Epoch: 5 [3200/12665 (25%)]\tLoss: 0.219213\n", - "Train Epoch: 5 [3840/12665 (30%)]\tLoss: 0.250186\n", - "Train Epoch: 5 [4480/12665 (35%)]\tLoss: 0.270830\n", - "Train Epoch: 5 [5120/12665 (40%)]\tLoss: 0.149153\n", - "Train Epoch: 5 [5760/12665 (45%)]\tLoss: 0.206908\n", - "Train Epoch: 5 [6400/12665 (51%)]\tLoss: 0.237038\n", - "Train Epoch: 5 [7040/12665 (56%)]\tLoss: 0.289587\n", - "Train Epoch: 5 [7680/12665 (61%)]\tLoss: 0.243903\n", - "Train Epoch: 5 [8320/12665 (66%)]\tLoss: 0.234777\n", - "Train Epoch: 5 [8960/12665 (71%)]\tLoss: 0.194367\n", - "Train Epoch: 5 [9600/12665 (76%)]\tLoss: 0.248726\n", - "Train Epoch: 5 [10240/12665 (81%)]\tLoss: 0.233232\n", - "Train Epoch: 5 [10880/12665 (86%)]\tLoss: 0.258024\n", - "Train Epoch: 5 [11520/12665 (91%)]\tLoss: 0.280726\n", - "Train Epoch: 5 [12160/12665 (96%)]\tLoss: 0.206879\n", - "\n", - "Test set: Average loss: 0.8039\n", - "Class 0 accuracy: 971.0/980(99%)\n", - "Class 1 accuracy: 1130.0/1135(100%)\n", - "Class 2 accuracy: 575.0/1032(56%)\n", - "Class 3 accuracy: 739.0/1010(73%)\n", - "Class 4 accuracy: 672.0/982(68%)\n", - "Class 5 accuracy: 520.0/892(58%)\n", - "Class 6 accuracy: 676.0/958(71%)\n", - 
"Class 7 accuracy: 812.0/1028(79%)\n", - "Class 8 accuracy: 597.0/974(61%)\n", - "Class 9 accuracy: 746.0/1009(74%)\n" + "Class 9 accuracy: 974.0/1009(97%)\n", + "Train Epoch: 2 [0/11800 (0%)]\tLoss: 0.106367\n", + "Train Epoch: 2 [640/11800 (5%)]\tLoss: 0.110765\n", + "Train Epoch: 2 [1280/11800 (11%)]\tLoss: 0.168906\n", + "Train Epoch: 2 [1920/11800 (16%)]\tLoss: 0.130259\n", + "Train Epoch: 2 [2560/11800 (22%)]\tLoss: 0.099700\n", + "Train Epoch: 2 [3200/11800 (27%)]\tLoss: 0.045566\n", + "Train Epoch: 2 [3840/11800 (32%)]\tLoss: 0.032498\n", + "Train Epoch: 2 [4480/11800 (38%)]\tLoss: 0.127420\n", + "Train Epoch: 2 [5120/11800 (43%)]\tLoss: 0.127244\n", + "Train Epoch: 2 [5760/11800 (49%)]\tLoss: 0.123305\n", + "Train Epoch: 2 [6400/11800 (54%)]\tLoss: 0.033301\n", + "Train Epoch: 2 [7040/11800 (59%)]\tLoss: 0.050663\n", + "Train Epoch: 2 [7680/11800 (65%)]\tLoss: 0.029956\n", + "Train Epoch: 2 [8320/11800 (70%)]\tLoss: 0.016801\n", + "Train Epoch: 2 [8960/11800 (76%)]\tLoss: 0.067689\n", + "Train Epoch: 2 [9600/11800 (81%)]\tLoss: 0.044518\n", + "Train Epoch: 2 [10240/11800 (86%)]\tLoss: 0.073524\n", + "Train Epoch: 2 [10880/11800 (92%)]\tLoss: 0.035689\n", + "Train Epoch: 2 [11520/11800 (97%)]\tLoss: 0.084134\n", + "\n", + "Test set: Average loss: 1.5479\n", + "Class 0 accuracy: 684.0/980(70%)\n", + "Class 1 accuracy: 893.0/1135(79%)\n", + "Class 2 accuracy: 470.0/1032(46%)\n", + "Class 3 accuracy: 346.0/1010(34%)\n", + "Class 4 accuracy: 312.0/982(32%)\n", + "Class 5 accuracy: 298.0/892(33%)\n", + "Class 6 accuracy: 758.0/958(79%)\n", + "Class 7 accuracy: 583.0/1028(57%)\n", + "Class 8 accuracy: 953.0/974(98%)\n", + "Class 9 accuracy: 977.0/1009(97%)\n", + "Train Epoch: 3 [0/11800 (0%)]\tLoss: 0.106828\n", + "Train Epoch: 3 [640/11800 (5%)]\tLoss: 0.064151\n", + "Train Epoch: 3 [1280/11800 (11%)]\tLoss: 0.064141\n", + "Train Epoch: 3 [1920/11800 (16%)]\tLoss: 0.046738\n", + "Train Epoch: 3 [2560/11800 (22%)]\tLoss: 0.060965\n", + "Train Epoch: 3 [3200/11800 
(27%)]\tLoss: 0.041177\n", + "Train Epoch: 3 [3840/11800 (32%)]\tLoss: 0.015125\n", + "Train Epoch: 3 [4480/11800 (38%)]\tLoss: 0.036628\n", + "Train Epoch: 3 [5120/11800 (43%)]\tLoss: 0.040213\n", + "Train Epoch: 3 [5760/11800 (49%)]\tLoss: 0.038948\n", + "Train Epoch: 3 [6400/11800 (54%)]\tLoss: 0.065069\n", + "Train Epoch: 3 [7040/11800 (59%)]\tLoss: 0.060684\n", + "Train Epoch: 3 [7680/11800 (65%)]\tLoss: 0.051811\n", + "Train Epoch: 3 [8320/11800 (70%)]\tLoss: 0.096974\n", + "Train Epoch: 3 [8960/11800 (76%)]\tLoss: 0.014142\n", + "Train Epoch: 3 [9600/11800 (81%)]\tLoss: 0.068916\n", + "Train Epoch: 3 [10240/11800 (86%)]\tLoss: 0.047880\n", + "Train Epoch: 3 [10880/11800 (92%)]\tLoss: 0.007572\n", + "Train Epoch: 3 [11520/11800 (97%)]\tLoss: 0.025779\n", + "\n", + "Test set: Average loss: 1.6151\n", + "Class 0 accuracy: 647.0/980(66%)\n", + "Class 1 accuracy: 885.0/1135(78%)\n", + "Class 2 accuracy: 492.0/1032(48%)\n", + "Class 3 accuracy: 379.0/1010(38%)\n", + "Class 4 accuracy: 323.0/982(33%)\n", + "Class 5 accuracy: 310.0/892(35%)\n", + "Class 6 accuracy: 736.0/958(77%)\n", + "Class 7 accuracy: 546.0/1028(53%)\n", + "Class 8 accuracy: 961.0/974(99%)\n", + "Class 9 accuracy: 976.0/1009(97%)\n", + "Train Epoch: 1 [0/12665 (0%)]\tLoss: 0.030852\n", + "Train Epoch: 1 [640/12665 (5%)]\tLoss: 0.051628\n", + "Train Epoch: 1 [1280/12665 (10%)]\tLoss: 0.097404\n", + "Train Epoch: 1 [1920/12665 (15%)]\tLoss: 0.066156\n", + "Train Epoch: 1 [2560/12665 (20%)]\tLoss: 0.085003\n", + "Train Epoch: 1 [3200/12665 (25%)]\tLoss: 0.022351\n", + "Train Epoch: 1 [3840/12665 (30%)]\tLoss: 0.047033\n", + "Train Epoch: 1 [4480/12665 (35%)]\tLoss: 0.021085\n", + "Train Epoch: 1 [5120/12665 (40%)]\tLoss: 0.038875\n", + "Train Epoch: 1 [5760/12665 (45%)]\tLoss: 0.035716\n", + "Train Epoch: 1 [6400/12665 (51%)]\tLoss: 0.033066\n", + "Train Epoch: 1 [7040/12665 (56%)]\tLoss: 0.020775\n", + "Train Epoch: 1 [7680/12665 (61%)]\tLoss: 0.027079\n", + "Train Epoch: 1 [8320/12665 
(66%)]\tLoss: 0.071041\n", + "Train Epoch: 1 [8960/12665 (71%)]\tLoss: 0.030695\n", + "Train Epoch: 1 [9600/12665 (76%)]\tLoss: 0.038757\n", + "Train Epoch: 1 [10240/12665 (81%)]\tLoss: 0.003501\n", + "Train Epoch: 1 [10880/12665 (86%)]\tLoss: 0.011310\n", + "Train Epoch: 1 [11520/12665 (91%)]\tLoss: 0.057821\n", + "Train Epoch: 1 [12160/12665 (96%)]\tLoss: 0.016945\n", + "\n", + "Test set: Average loss: 1.3637\n", + "Class 0 accuracy: 977.0/980(100%)\n", + "Class 1 accuracy: 1133.0/1135(100%)\n", + "Class 2 accuracy: 574.0/1032(56%)\n", + "Class 3 accuracy: 561.0/1010(56%)\n", + "Class 4 accuracy: 494.0/982(50%)\n", + "Class 5 accuracy: 328.0/892(37%)\n", + "Class 6 accuracy: 656.0/958(68%)\n", + "Class 7 accuracy: 753.0/1028(73%)\n", + "Class 8 accuracy: 701.0/974(72%)\n", + "Class 9 accuracy: 866.0/1009(86%)\n", + "Train Epoch: 2 [0/12665 (0%)]\tLoss: 0.016473\n", + "Train Epoch: 2 [640/12665 (5%)]\tLoss: 0.007508\n", + "Train Epoch: 2 [1280/12665 (10%)]\tLoss: 0.037633\n", + "Train Epoch: 2 [1920/12665 (15%)]\tLoss: 0.026398\n", + "Train Epoch: 2 [2560/12665 (20%)]\tLoss: 0.004491\n", + "Train Epoch: 2 [3200/12665 (25%)]\tLoss: 0.002447\n", + "Train Epoch: 2 [3840/12665 (30%)]\tLoss: 0.007396\n", + "Train Epoch: 2 [4480/12665 (35%)]\tLoss: 0.022243\n", + "Train Epoch: 2 [5120/12665 (40%)]\tLoss: 0.032471\n", + "Train Epoch: 2 [5760/12665 (45%)]\tLoss: 0.012960\n", + "Train Epoch: 2 [6400/12665 (51%)]\tLoss: 0.009143\n", + "Train Epoch: 2 [7040/12665 (56%)]\tLoss: 0.005618\n", + "Train Epoch: 2 [7680/12665 (61%)]\tLoss: 0.016858\n", + "Train Epoch: 2 [8320/12665 (66%)]\tLoss: 0.015019\n", + "Train Epoch: 2 [8960/12665 (71%)]\tLoss: 0.042326\n", + "Train Epoch: 2 [9600/12665 (76%)]\tLoss: 0.005700\n", + "Train Epoch: 2 [10240/12665 (81%)]\tLoss: 0.020611\n", + "Train Epoch: 2 [10880/12665 (86%)]\tLoss: 0.011131\n", + "Train Epoch: 2 [11520/12665 (91%)]\tLoss: 0.019555\n", + "Train Epoch: 2 [12160/12665 (96%)]\tLoss: 0.015460\n", + "\n", + "Test set: Average loss: 
1.5375\n", + "Class 0 accuracy: 977.0/980(100%)\n", + "Class 1 accuracy: 1133.0/1135(100%)\n", + "Class 2 accuracy: 500.0/1032(48%)\n", + "Class 3 accuracy: 503.0/1010(50%)\n", + "Class 4 accuracy: 489.0/982(50%)\n", + "Class 5 accuracy: 362.0/892(41%)\n", + "Class 6 accuracy: 639.0/958(67%)\n", + "Class 7 accuracy: 746.0/1028(73%)\n", + "Class 8 accuracy: 657.0/974(67%)\n", + "Class 9 accuracy: 847.0/1009(84%)\n", + "Train Epoch: 3 [0/12665 (0%)]\tLoss: 0.003884\n", + "Train Epoch: 3 [640/12665 (5%)]\tLoss: 0.024282\n", + "Train Epoch: 3 [1280/12665 (10%)]\tLoss: 0.007995\n", + "Train Epoch: 3 [1920/12665 (15%)]\tLoss: 0.006038\n", + "Train Epoch: 3 [2560/12665 (20%)]\tLoss: 0.007882\n", + "Train Epoch: 3 [3200/12665 (25%)]\tLoss: 0.008968\n", + "Train Epoch: 3 [3840/12665 (30%)]\tLoss: 0.007985\n", + "Train Epoch: 3 [4480/12665 (35%)]\tLoss: 0.017382\n", + "Train Epoch: 3 [5120/12665 (40%)]\tLoss: 0.006549\n", + "Train Epoch: 3 [5760/12665 (45%)]\tLoss: 0.006111\n", + "Train Epoch: 3 [6400/12665 (51%)]\tLoss: 0.016712\n", + "Train Epoch: 3 [7040/12665 (56%)]\tLoss: 0.009508\n", + "Train Epoch: 3 [7680/12665 (61%)]\tLoss: 0.013591\n", + "Train Epoch: 3 [8320/12665 (66%)]\tLoss: 0.002323\n", + "Train Epoch: 3 [8960/12665 (71%)]\tLoss: 0.003972\n", + "Train Epoch: 3 [9600/12665 (76%)]\tLoss: 0.002240\n", + "Train Epoch: 3 [10240/12665 (81%)]\tLoss: 0.012233\n", + "Train Epoch: 3 [10880/12665 (86%)]\tLoss: 0.046749\n", + "Train Epoch: 3 [11520/12665 (91%)]\tLoss: 0.006683\n", + "Train Epoch: 3 [12160/12665 (96%)]\tLoss: 0.006137\n", + "\n", + "Test set: Average loss: 1.5670\n", + "Class 0 accuracy: 976.0/980(100%)\n", + "Class 1 accuracy: 1134.0/1135(100%)\n", + "Class 2 accuracy: 509.0/1032(49%)\n", + "Class 3 accuracy: 520.0/1010(51%)\n", + "Class 4 accuracy: 496.0/982(51%)\n", + "Class 5 accuracy: 355.0/892(40%)\n", + "Class 6 accuracy: 625.0/958(65%)\n", + "Class 7 accuracy: 743.0/1028(72%)\n", + "Class 8 accuracy: 654.0/974(67%)\n", + "Class 9 accuracy: 
854.0/1009(85%)\n" ] + }, + { + "output_type": "execute_result", + "data": { + "text/plain": [ + "[{0: 0.9959183673469387,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1'},\n", + " {0: 0.9959183673469387,\n", + " 1: 1.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1'},\n", + " {0: 0.996938775510204,\n", + " 1: 1.0,\n", + " 2: 0.0,\n", + " 3: 0.0,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '0_1'},\n", + " {0: 0.8459183673469388,\n", + " 1: 0.9215859030837005,\n", + " 2: 0.9602713178294574,\n", + " 3: 0.9732673267326732,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '2_3'},\n", + " {0: 0.7795918367346939,\n", + " 1: 0.8801762114537445,\n", + " 2: 0.9689922480620154,\n", + " 3: 0.9782178217821782,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '2_3'},\n", + " {0: 0.7377551020408163,\n", + " 1: 0.852863436123348,\n", + " 2: 0.9680232558139535,\n", + " 3: 0.9821782178217822,\n", + " 4: 0.0,\n", + " 5: 0.0,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '2_3'},\n", + " {0: 0.7755102040816326,\n", + " 1: 0.8687224669603524,\n", + " 2: 0.6434108527131783,\n", + " 3: 0.36336633663366336,\n", + " 4: 0.9969450101832994,\n", + " 5: 0.968609865470852,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '4_5'},\n", + " {0: 0.6602040816326531,\n", + " 1: 0.8546255506607929,\n", + " 2: 0.5968992248062015,\n", + " 3: 0.2376237623762376,\n", + " 4: 0.9969450101832994,\n", + " 5: 0.9820627802690582,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': 
'4_5'},\n", + " {0: 0.6755102040816326,\n", + " 1: 0.8563876651982378,\n", + " 2: 0.5406976744186046,\n", + " 3: 0.22574257425742575,\n", + " 4: 0.9959266802443992,\n", + " 5: 0.9899103139013453,\n", + " 6: 0.0,\n", + " 7: 0.0,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '4_5'},\n", + " {0: 0.6816326530612244,\n", + " 1: 0.8590308370044053,\n", + " 2: 0.46027131782945735,\n", + " 3: 0.48415841584158414,\n", + " 4: 0.7036659877800407,\n", + " 5: 0.6322869955156951,\n", + " 6: 0.9895615866388309,\n", + " 7: 0.97568093385214,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '6_7'},\n", + " {0: 0.6959183673469388,\n", + " 1: 0.8537444933920705,\n", + " 2: 0.46511627906976744,\n", + " 3: 0.46633663366336636,\n", + " 4: 0.6466395112016293,\n", + " 5: 0.5426008968609866,\n", + " 6: 0.9916492693110647,\n", + " 7: 0.9854085603112841,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '6_7'},\n", + " {0: 0.6489795918367347,\n", + " 1: 0.8414096916299559,\n", + " 2: 0.437015503875969,\n", + " 3: 0.4277227722772277,\n", + " 4: 0.5723014256619144,\n", + " 5: 0.5134529147982063,\n", + " 6: 0.9937369519832986,\n", + " 7: 0.9902723735408561,\n", + " 8: 0.0,\n", + " 9: 0.0,\n", + " 'phase': '6_7'},\n", + " {0: 0.7244897959183674,\n", + " 1: 0.8255506607929516,\n", + " 2: 0.5087209302325582,\n", + " 3: 0.404950495049505,\n", + " 4: 0.37474541751527496,\n", + " 5: 0.4024663677130045,\n", + " 6: 0.8162839248434238,\n", + " 7: 0.5710116731517509,\n", + " 8: 0.9702258726899384,\n", + " 9: 0.9653121902874133,\n", + " 'phase': '8_9'},\n", + " {0: 0.6979591836734694,\n", + " 1: 0.786784140969163,\n", + " 2: 0.45542635658914726,\n", + " 3: 0.3425742574257426,\n", + " 4: 0.31771894093686354,\n", + " 5: 0.33408071748878926,\n", + " 6: 0.791231732776618,\n", + " 7: 0.5671206225680934,\n", + " 8: 0.9784394250513347,\n", + " 9: 0.9682854311199207,\n", + " 'phase': '8_9'},\n", + " {0: 0.6602040816326531,\n", + " 1: 0.7797356828193832,\n", + " 2: 0.47674418604651164,\n", + " 3: 
0.37524752475247525,\n", + " 4: 0.3289205702647658,\n", + " 5: 0.3475336322869955,\n", + " 6: 0.7682672233820459,\n", + " 7: 0.5311284046692607,\n", + " 8: 0.9866529774127311,\n", + " 9: 0.9672943508424182,\n", + " 'phase': '8_9'},\n", + " {0: 0.996938775510204,\n", + " 1: 0.9982378854625551,\n", + " 2: 0.5562015503875969,\n", + " 3: 0.5554455445544555,\n", + " 4: 0.5030549898167006,\n", + " 5: 0.36771300448430494,\n", + " 6: 0.6847599164926931,\n", + " 7: 0.7324902723735408,\n", + " 8: 0.7197125256673511,\n", + " 9: 0.8582755203171457,\n", + " 'phase': '0_1_again'},\n", + " {0: 0.996938775510204,\n", + " 1: 0.9982378854625551,\n", + " 2: 0.4844961240310077,\n", + " 3: 0.498019801980198,\n", + " 4: 0.4979633401221996,\n", + " 5: 0.40582959641255606,\n", + " 6: 0.6670146137787056,\n", + " 7: 0.72568093385214,\n", + " 8: 0.6745379876796714,\n", + " 9: 0.8394449950445986,\n", + " 'phase': '0_1_again'},\n", + " {0: 0.9959183673469387,\n", + " 1: 0.9991189427312775,\n", + " 2: 0.4932170542635659,\n", + " 3: 0.5148514851485149,\n", + " 4: 0.505091649694501,\n", + " 5: 0.39798206278026904,\n", + " 6: 0.6524008350730689,\n", + " 7: 0.7227626459143969,\n", + " 8: 0.6714579055441479,\n", + " 9: 0.846382556987116,\n", + " 'phase': '0_1_again'}]" + ] + }, + "metadata": {}, + "execution_count": 20 } ] }, @@ -3067,11 +2125,571 @@ }, { "cell_type": "code", - "execution_count": 18, + "execution_count": 11, "metadata": { - "id": "gimHfUXdW4_K" + "id": "gimHfUXdW4_K", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 459 + }, + "outputId": "3a07ff95-27df-468d-f571-414c99f1ca1e" }, - "outputs": [], + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": [ + " epoch 0 1 2 3 4 5 6 7 8 9 phase\n", + "0 0 0.96 0.97 0.82 0.85 0.59 0.35 0.86 0.85 0.52 0.82 baseline" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epoch0123456789phase
000.960.970.820.850.590.350.860.850.520.82baseline
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ] + }, + "metadata": {} + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + " epoch 0 1 2 3 4 5 6 7 8 9 phase\n", + "0 0 1.0 1.0 0.00 0.0 0.00 0.00 0.0 0.00 0.0 0.00 0_1\n", + "1 1 0.0 0.0 0.14 1.0 0.00 0.00 0.0 0.00 0.0 0.00 2_3\n", + "2 2 0.0 0.0 0.00 0.0 0.99 0.89 0.0 0.00 0.0 0.00 4_5\n", + "3 3 0.0 0.0 0.00 0.0 0.00 0.00 1.0 0.93 0.0 0.00 6_7\n", + "4 4 0.0 0.0 0.00 0.0 0.00 0.00 0.0 0.00 1.0 0.52 8_9" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epoch0123456789phase
001.01.00.000.00.000.000.00.000.00.000_1
110.00.00.141.00.000.000.00.000.00.002_3
220.00.00.000.00.990.890.00.000.00.004_5
330.00.00.000.00.000.001.00.930.00.006_7
440.00.00.000.00.000.000.00.001.00.528_9
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ] + }, + "metadata": {} + }, + { + "output_type": "display_data", + "data": { + "text/plain": [ + " epoch 0 1 2 3 4 5 6 7 8 9 phase\n", + "0 0 1.00 0.99 0.00 0.00 0.00 0.00 0.00 0.00 0.00 0.00 0_1\n", + "1 1 0.04 0.51 0.23 1.00 0.00 0.00 0.00 0.00 0.00 0.00 2_3\n", + "2 2 0.71 0.64 0.06 0.00 0.98 0.85 0.00 0.00 0.00 0.00 4_5\n", + "3 3 0.23 0.53 0.00 0.01 0.00 0.00 0.99 0.96 0.00 0.00 6_7\n", + "4 4 0.44 0.55 0.00 0.00 0.00 0.00 0.19 0.00 0.98 0.88 8_9" + ], + "text/html": [ + "\n", + "
\n", + "
\n", + "
\n", + "\n", + "\n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + " \n", + "
epoch0123456789phase
001.000.990.000.000.000.000.000.000.000.000_1
110.040.510.231.000.000.000.000.000.000.002_3
220.710.640.060.000.980.850.000.000.000.004_5
330.230.530.000.010.000.000.990.960.000.006_7
440.440.550.000.000.000.000.190.000.980.888_9
\n", + "
\n", + " \n", + " \n", + " \n", + "\n", + " \n", + "
\n", + "
\n", + " " + ] + }, + "metadata": {} + } + ], "source": [ "# The following helper code takes the logs and converts them into a dataframe\n", "# for easier reading. You can also store the result as a CSV or HDF file by\n", @@ -3087,17 +2705,33 @@ " return logs\n", "\n", "#display(format_results(history_regular_mnist).head())\n", - "#display(format_results(history_catastrophic_forgetting).head())\n", - "#display(format_results(history_memory_replay).head())" + "display(format_results(history_catastrophic_forgetting).head())\n", + "display(format_results(history_memory_replay).head())" ] }, { "cell_type": "code", - "execution_count": null, + "execution_count": 25, "metadata": { - "id": "jR6eRKn4WguU" + "id": "jR6eRKn4WguU", + "colab": { + "base_uri": "https://localhost:8080/", + "height": 807 + }, + "outputId": "a20c835b-1f62-4b6c-cd45-745f122a0041" }, - "outputs": [], + "outputs": [ + { + "output_type": "display_data", + "data": { + "text/plain": [ + "
" + ], + "image/png": "\n" + }, + "metadata": {} + } + ], "source": [ "# Finally, we plot the results and optionally compare the three different training setups.\n", "# Try to adapt and extend the plotting function to the needs of your experimental setup.\n", @@ -3105,12 +2739,13 @@ "import matplotlib.pyplot as plt\n", "import seaborn as sns\n", "\n", - "fig, axes = plt.subplots(10, 2,figsize = (5, 7), sharex = True)\n", + "fig, axes = plt.subplots(10, 2, figsize = (6, 8), sharex = True)\n", "\n", "# Iterate over the different training setups for comparison\n", "for log_id, logs in enumerate([history_catastrophic_forgetting, history_memory_replay]):\n", " # Format the logs into a dataframe\n", " logs = format_results(logs)\n", + "\n", " # Iterate through the 10 different MNIST classes (0...9). We will plot one subpanel\n", " # for each of them, showing the accuracies for that particular class over the course\n", " # of the entire training.\n", @@ -3124,24 +2759,13 @@ " \n", " # Finally, we will optimize the plot a bit and remove unneeded lines\n", " ax.set_ylim([0, 1])\n", + " ax.set_ylabel(f\"Acc '{class_}'\")\n", " sns.despine(bottom = True, trim = True)\n", "\n", - "axes[-1].set_xlabel(\"Epochs\")\n", + " ax.set_xlabel(\"Epochs\")\n", + "plt.tight_layout()\n", "plt.show()" ] - }, - { - "cell_type": "markdown", - "source": [ - "Here are some example outputs:\n", - "\n", - "| With catastrophic forgetting | Training setup using a regularizer |\n", - "|-|-|\n", - "|![image.png]() |![image.png]() |" - ], - "metadata": { - "id": "5RolXP_mTxwp" - } } ], "metadata": {