111
111
" from data.cifar100 import Cifar100\n " ,
112
112
" from model.resnet_cifar import resnet32\n " ,
113
113
" from model.manager import Manager\n " ,
114
+ " from model.lwf import LWF\n " ,
114
115
" from model.icarl import Exemplars\n " ,
115
116
" from model.icarl import iCaRL\n " ,
116
117
" from utils import plot"
301
302
" criterion = nn.BCEWithLogitsLoss()\n " ,
302
303
" \n " ,
303
304
" for split_i in range(10):\n " ,
304
- " print(f\" # Split {split_i} of run {run_i}\" )\n " ,
305
+ " print(f\" ## Split {split_i} of run {run_i} ## \" )\n " ,
305
306
" \n " ,
306
307
" parameters_to_optimize = net.parameters()\n " ,
307
308
" optimizer = optim.SGD(parameters_to_optimize, lr=LR, momentum=MOMENTUM, weight_decay=WEIGHT_DECAY)\n " ,
326
327
" test_accuracy, all_targets, all_preds = manager.test()\n " ,
327
328
" \n " ,
328
329
" logs[run_i][split_i]['test_accuracy'] = test_accuracy\n " ,
330
+ " logs[run_i][split_i]['conf_mat'] = confusion_matrix(all_targets.to('cpu'), all_preds.to('cpu'))\n " ,
329
331
" \n " ,
330
332
" # Add 10 nodes to last FC layer\n " ,
331
333
" manager.increment_classes(n=10)"
332
334
],
333
335
"execution_count" : null ,
334
336
"outputs" : []
335
337
},
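For reference, the head expansion performed by `increment_classes` (its implementation appears in the `LWF` class removed further down) replaces the final fully connected layer with a wider one and copies the learned weights back in. A minimal standalone sketch, assuming a ResNet that exposes its classifier as `net.fc`:

```python
import torch.nn as nn

def increment_classes(net, n=10):
    """Widen the final FC layer by n outputs, preserving learned weights."""
    in_features = net.fc.in_features
    out_features = net.fc.out_features
    weight = net.fc.weight.data

    net.fc = nn.Linear(in_features, out_features + n)
    net.fc.weight.data[:out_features] = weight  # old classes keep their weights
    # The bias for the old classes could be carried over the same way;
    # the original code copies only the weight matrix.
```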
336
- {
337
- "cell_type" : " code" ,
338
- "metadata" : {
339
- "colab_type" : " code" ,
340
- "id" : " JWdj0wvu996S" ,
341
- "colab" : {}
342
- },
343
- "source" : [
344
- " # Confusion matrix over last run test predictions\n " ,
345
- " targets = test_dataset.targets\n " ,
346
- " preds = all_preds.to('cpu').numpy()\n " ,
347
- " \n " ,
348
- " plot.heatmap_cm(targets, preds)"
349
- ],
350
- "execution_count" : null ,
351
- "outputs" : []
352
- },
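The removed cell relied on `plot.heatmap_cm`, a project helper whose source is not part of this diff. A plausible minimal implementation, assuming matplotlib and scikit-learn (an illustrative sketch, not the project's actual code):

```python
import matplotlib.pyplot as plt
from sklearn.metrics import confusion_matrix

def heatmap_cm(targets, preds):
    """Render the confusion matrix of targets vs. predictions as a heatmap."""
    cm = confusion_matrix(targets, preds)
    fig, ax = plt.subplots(figsize=(8, 8))
    im = ax.imshow(cm)
    ax.set_xlabel('Predicted class')
    ax.set_ylabel('True class')
    fig.colorbar(im)
    plt.show()
```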
353
338
{
354
339
"cell_type" : " code" ,
355
340
"metadata" : {
415
400
" ## Learning Without Forgetting"
416
401
]
417
402
},
418
- {
419
- "cell_type" : " markdown" ,
420
- "metadata" : {
421
- "id" : " ERL_PF-cm1N_" ,
422
- "colab_type" : " text"
423
- },
424
- "source" : [
425
- " ### Arguments"
426
- ]
427
- },
428
- {
429
- "cell_type" : " code" ,
430
- "metadata" : {
431
- "colab_type" : " code" ,
432
- "id" : " JHBfXPTXm16d" ,
433
- "colab" : {}
434
- },
435
- "source" : [
436
- " # Training settings for Learning Without Forgetting\n " ,
437
- " RANDOM_STATES = [658, 423, 422] \n " ,
438
- " BATCH_SIZE = 128\n " ,
439
- " LR = 2"
440
- ],
441
- "execution_count" : null ,
442
- "outputs" : []
443
- },
444
403
{
445
404
"cell_type" : " markdown" ,
446
405
"metadata" : {
486
445
" test_dataloaders = [[] for i in range(NUM_RUNS)]\n " ,
487
446
" \n " ,
488
447
" for run_i in range(NUM_RUNS):\n " ,
448
+ " test_subsets = []\n " ,
449
+ " random_state = RANDOM_STATES[run_i]\n " ,
489
450
" \n " ,
490
- " test_subsets = []\n " ,
491
- " random_state = RANDOM_STATES[run_i]\n " ,
451
+ " for split_i in range(10):\n " ,
452
+ " # Download dataset only at first instantiation\n " ,
453
+ " if run_i+split_i == 0:\n " ,
454
+ " download = True\n " ,
455
+ " else:\n " ,
456
+ " download = False\n " ,
492
457
" \n " ,
493
- " for split_i in range(CLASS_BATCH_SIZE):\n " ,
458
+ " # Create CIFAR100 dataset\n " ,
459
+ " train_dataset = Cifar100(DATA_DIR, train=True, download=download, random_state=random_state, transform=train_transform)\n " ,
460
+ " test_dataset = Cifar100(DATA_DIR, train=False, download=False, random_state=random_state, transform=test_transform)\n " ,
494
461
" \n " ,
495
- " # Download dataset only at first instantiation\n " ,
496
- " if(run_i+split_i == 0):\n " ,
497
- " download = True\n " ,
498
- " else:\n " ,
499
- " download = False\n " ,
462
+ " # Subspace of CIFAR100 of 10 classes\n " ,
463
+ " train_dataset.set_classes_batch(train_dataset.batch_splits[split_i])\n " ,
464
+ " test_dataset.set_classes_batch([test_dataset.batch_splits[i] for i in range(0, split_i+1)])\n " ,
500
465
" \n " ,
501
- " # Create CIFAR100 dataset\n " ,
502
- " train_dataset = Cifar100(DATA_DIR, train = True, download = download, random_state = random_state, transform=train_transform)\n " ,
503
- " test_dataset = Cifar100(DATA_DIR, train = False, download = False, random_state = random_state, transform=test_transform)\n " ,
504
- " \n " ,
505
- " # Subspace of CIFAR100 of 10 classes\n " ,
506
- " train_dataset.set_classes_batch(train_dataset.batch_splits[split_i]) \n " ,
507
- " test_dataset.set_classes_batch([test_dataset.batch_splits[i] for i in range(0, split_i+1)])\n " ,
466
+ " # Define train and validation indices\n " ,
467
+ " train_indices, val_indices = train_dataset.train_val_split(VAL_SIZE, random_state)\n " ,
508
468
" \n " ,
509
- " # Define train and validation indices\n " ,
510
- " train_indices, val_indices = train_dataset.train_val_split(VAL_SIZE, random_state)\n " ,
511
- " \n " ,
512
- " train_dataloaders[run_i].append(DataLoader(Subset(train_dataset, train_indices), \n " ,
513
- " batch_size=BATCH_SIZE, shuffle=True, num_workers=4, drop_last=True))\n " ,
514
- " \n " ,
515
- " val_dataloaders[run_i].append(DataLoader(Subset(train_dataset, val_indices), \n " ,
516
- " batch_size=BATCH_SIZE, shuffle=True, num_workers=4, drop_last=True))\n " ,
517
- " \n " ,
518
- " # Dataset with all seen class\n " ,
519
- " test_dataloaders[run_i].append(DataLoader(test_dataset, \n " ,
520
- " batch_size=BATCH_SIZE, shuffle=True, num_workers=4)) "
469
+ " train_dataloaders[run_i].append(DataLoader(Subset(train_dataset, train_indices),\n " ,
470
+ " batch_size=BATCH_SIZE, shuffle=True, num_workers=4, drop_last=True))\n " ,
471
+ " \n " ,
472
+ " val_dataloaders[run_i].append(DataLoader(Subset(train_dataset, val_indices),\n " ,
473
+ " batch_size=BATCH_SIZE, shuffle=True, num_workers=4, drop_last=True))\n " ,
474
+ " \n " ,
475
+ " # Dataset with all seen class\n " ,
476
+ " test_dataloaders[run_i].append(DataLoader(test_dataset,\n " ,
477
+ " batch_size=BATCH_SIZE, shuffle=True, num_workers=4))"
521
478
],
522
479
"execution_count" : null ,
523
480
"outputs" : []
534
491
" dataiter = iter(test_dataloaders[0][5])\n " ,
535
492
" images, labels = dataiter.next()\n " ,
536
493
" \n " ,
537
- " plot.image_grid(images, one_channel=False)\n " ,
538
- " unique_labels = np.unique(labels, return_counts=True)\n " ,
539
- " unique_labels"
494
+ " plot.image_grid(images, one_channel=False)"
540
495
],
541
496
"execution_count" : null ,
542
497
"outputs" : []
543
498
},
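`plot.image_grid` is another `utils/plot.py` helper outside this diff; a typical version built on `torchvision.utils.make_grid` could look like this (an assumption, not the repository's code):

```python
import matplotlib.pyplot as plt
import numpy as np
import torchvision

def image_grid(images, one_channel=False):
    """Display a batch of image tensors as a single grid."""
    grid = torchvision.utils.make_grid(images)
    npimg = grid.numpy()
    if one_channel:
        plt.imshow(npimg.mean(axis=0), cmap='Greys')
    else:
        plt.imshow(np.transpose(npimg, (1, 2, 0)))  # CHW -> HWC for matplotlib
    plt.show()
```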
499
+ {
500
+ "cell_type" : " markdown" ,
501
+ "metadata" : {
502
+ "id" : " iYwMtMJuLyYe" ,
503
+ "colab_type" : " text"
504
+ },
505
+ "source" : [
506
+ " ### Execution"
507
+ ]
508
+ },
544
509
{
545
510
"cell_type" : " code" ,
546
511
"metadata" : {
547
- "id" : " cw6a_xAumXQW " ,
512
+ "id" : " JpGuC_hSL0jN " ,
548
513
"colab_type" : " code" ,
549
514
"colab" : {}
550
515
},
551
516
"source" : [
552
- " from torch.nn import BCEWithLogitsLoss\n " ,
553
- " from copy import deepcopy\n " ,
554
- " \n " ,
555
- " '''BCE formulation:\n " ,
556
- " let x = logits, z = labels. The logistic loss is\n " ,
557
- " \n " ,
558
- " z * -log(sigmoid(x)) + (1 - z) * -log(1 - sigmoid(x))\n " ,
559
- " '''\n " ,
560
- " \n " ,
561
- " \n " ,
562
- " CLASS_BATCH_SIZE = 10\n " ,
563
- " \n " ,
564
- " \n " ,
565
- " class LWF():\n " ,
566
- " def __init__(self, device, net, old_net, criterion, optimizer, scheduler,\n " ,
567
- " train_dataloader, val_dataloader, test_dataloader, num_classes=10):\n " ,
568
- " \n " ,
569
- " self.device = device\n " ,
570
- " \n " ,
571
- " self.net = net\n " ,
572
- " self.best_net = self.net\n " ,
573
- " self.old_net = old_net # None for first ten classes\n " ,
574
- " \n " ,
575
- " self.criterion = BCEWithLogitsLoss() # Classifier criterion \n " ,
576
- " self.optimizer = optimizer\n " ,
577
- " self.scheduler = scheduler\n " ,
578
- " \n " ,
579
- " self.train_dataloader = train_dataloader\n " ,
580
- " self.val_dataloader = val_dataloader\n " ,
581
- " self.test_dataloader = test_dataloader\n " ,
582
- " \n " ,
583
- " self.num_classes = num_classes # can be incremented ouitside methods in the main, or inside methods\n " ,
584
- " self.order = np.arange(100)\n " ,
585
- " \n " ,
586
- " self.sigmoid = nn.Sigmoid()\n " ,
587
- " \n " ,
588
- " \n " ,
589
- " def warm_up():\n " ,
590
- " pass\n " ,
591
- " \n " ,
592
- " def increment_classes(self, n=10):\n " ,
593
- " \"\"\" Add n classes in the final fully connected layer.\"\"\"\n " ,
594
- " \n " ,
595
- " in_features = self.net.fc.in_features # size of each input sample\n " ,
596
- " out_features = self.net.fc.out_features # size of each output sample\n " ,
597
- " weight = self.net.fc.weight.data\n " ,
598
- " \n " ,
599
- " self.net.fc = nn.Linear(in_features, out_features+n)\n " ,
600
- " self.net.fc.weight.data[:out_features] = weight\n " ,
601
- " \n " ,
602
- " def to_onehot(self, targets): \n " ,
603
- " '''\n " ,
604
- " Args:\n " ,
605
- " targets : dataloader.dataset.targets of the new task images\n " ,
606
- " '''\n " ,
607
- " one_hot_targets = torch.eye(self.num_classes)[targets]\n " ,
608
- " \n " ,
609
- " return one_hot_targets.to(self.device)\n " ,
610
- " \n " ,
611
- " def do_first_batch(self, batch, labels):\n " ,
612
- " \n " ,
613
- " batch = batch.to(self.device)\n " ,
614
- " labels = labels.to(self.device) # new classes labels\n " ,
615
- " \n " ,
616
- " # Zero-ing the gradients\n " ,
617
- " self.optimizer.zero_grad()\n " ,
618
- " \n " ,
619
- " # One hot encoding of new task labels \n " ,
620
- " one_hot_labels = self.to_onehot(labels) # Size = [128, 10]\n " ,
621
- " \n " ,
622
- " # New net forward pass\n " ,
623
- " outputs = self.net(batch) \n " ,
624
- " \n " ,
625
- " loss = self.criterion(outputs, one_hot_labels) # BCE Loss with sigmoids over outputs\n " ,
626
- " \n " ,
627
- " # Get predictions\n " ,
628
- " _, preds = torch.max(outputs.data, 1)\n " ,
629
- " \n " ,
630
- " # Accuracy over NEW IMAGES, not over all images\n " ,
631
- " running_corrects = \\\n " ,
632
- " torch.sum(preds == labels.data).data.item() # Può essere che debba usare targets e non labels\n " ,
633
- " \n " ,
634
- " # Backward pass: computes gradients\n " ,
635
- " loss.backward()\n " ,
636
- " \n " ,
637
- " self.optimizer.step()\n " ,
638
- " \n " ,
639
- " return loss, running_corrects\n " ,
640
- " \n " ,
641
- " \n " ,
642
- " def do_batch(self, batch, labels):\n " ,
643
- " \n " ,
644
- " batch = batch.to(self.device)\n " ,
645
- " labels = labels.to(self.device) # new classes labels\n " ,
646
- " \n " ,
647
- " # Zero-ing the gradients\n " ,
648
- " self.optimizer.zero_grad()\n " ,
649
- " \n " ,
650
- " # One hot encoding of new task labels \n " ,
651
- " one_hot_labels = self.to_onehot(labels) # Size = [128, n_classes] will be sliced as [:, :self.num_classes-10]\n " ,
652
- " new_classes = (self.order[range(self.num_classes-10, self.num_classes)]).astype(np.int32)\n " ,
653
- " one_hot_labels = torch.stack([one_hot_labels[:, i] for i in new_classes], axis=1)\n " ,
654
- " \n " ,
655
- " # Old net forward pass\n " ,
656
- " old_outputs = self.sigmoid(self.old_net(batch)) # Size = [128, 100]\n " ,
657
- " old_classes = (self.order[range(self.num_classes-10)]).astype(np.int32)\n " ,
658
- " old_outputs = torch.stack([old_outputs[:, i] for i in old_classes], axis =1)\n " ,
659
- " \n " ,
660
- " # Combine new and old class targets\n " ,
661
- " targets = torch.cat((old_outputs, one_hot_labels), 1)\n " ,
662
- " \n " ,
663
- " # New net forward pass\n " ,
664
- " outputs = self.net(batch) # Size = [128, 100] comparable with the define targets\n " ,
665
- " out_classes = (self.order[range(self.num_classes)]).astype(np.int32)\n " ,
666
- " outputs = torch.stack([outputs[:, i] for i in out_classes], axis=1)\n " ,
667
- " \n " ,
668
- " \n " ,
669
- " loss = self.criterion(outputs, targets) # BCE Loss with sigmoids over outputs (over targets must be done manually)\n " ,
670
- " \n " ,
671
- " # Get predictions\n " ,
672
- " _, preds = torch.max(outputs.data, 1)\n " ,
673
- " \n " ,
674
- " # Accuracy over NEW IMAGES, not over all images\n " ,
675
- " running_corrects = \\\n " ,
676
- " torch.sum(preds == labels.data).data.item() \n " ,
677
- " \n " ,
678
- " # Backward pass: computes gradients\n " ,
679
- " loss.backward()\n " ,
680
- " \n " ,
681
- " self.optimizer.step()\n " ,
682
- " \n " ,
683
- " return loss, running_corrects\n " ,
684
- " \n " ,
685
- " \n " ,
686
- " def do_epoch(self, current_epoch):\n " ,
687
- " \n " ,
688
- " self.net.train()\n " ,
689
- " \n " ,
690
- " running_train_loss = 0\n " ,
691
- " running_corrects = 0\n " ,
692
- " total = 0\n " ,
693
- " batch_idx = 0\n " ,
694
- " \n " ,
695
- " print(f\" Epoch: {current_epoch}, LR: {self.scheduler.get_last_lr()}\" )\n " ,
696
- " \n " ,
697
- " for images, labels in self.train_dataloader:\n " ,
698
- " \n " ,
699
- " if self.num_classes == CLASS_BATCH_SIZE:\n " ,
700
- " loss, corrects = self.do_first_batch(images, labels)\n " ,
701
- " else:\n " ,
702
- " loss, corrects = self.do_batch(images, labels)\n " ,
703
- " \n " ,
704
- " running_train_loss += loss.item()\n " ,
705
- " running_corrects += corrects\n " ,
706
- " total += labels.size(0)\n " ,
707
- " batch_idx += 1\n " ,
708
- " \n " ,
709
- " self.scheduler.step()\n " ,
710
- " \n " ,
711
- " # Calculate average scores\n " ,
712
- " train_loss = running_train_loss / batch_idx # Average over all batches\n " ,
713
- " train_accuracy = running_corrects / float(total) # Average over all samples\n " ,
714
- " \n " ,
715
- " print(f\" Train loss: {train_loss}, Train accuracy: {train_accuracy}\" )\n " ,
716
- " \n " ,
717
- " return (train_loss, train_accuracy)\n " ,
718
- " \n " ,
517
+ " # Arguments for Learning without Forgetting\n " ,
518
+ " BATCH_SIZE = 128\n " ,
519
+ " LR = 2"
520
+ ],
521
+ "execution_count" : null ,
522
+ "outputs" : []
523
+ },
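`LR = 2` is unusually large for SGD, but it is the value used by the iCaRL training protocol this notebook follows, and it pairs with a sum of binary cross-entropies rather than softmax cross-entropy. `nn.BCEWithLogitsLoss` is the numerically stable fused form of the formula quoted in the removed `LWF` docstring, `z * -log(sigmoid(x)) + (1 - z) * -log(1 - sigmoid(x))`; a quick self-contained check:

```python
import torch
import torch.nn as nn

logits = torch.tensor([[2.0, -1.0, 0.5]])   # x: raw scores for 3 classes
targets = torch.tensor([[1.0, 0.0, 1.0]])   # z: binary targets

fused = nn.BCEWithLogitsLoss()(logits, targets)
manual = nn.BCELoss()(torch.sigmoid(logits), targets)  # sigmoid, then plain BCE

print(torch.allclose(fused, manual))        # True, up to floating-point error
```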
524
+ {
525
+ "cell_type" : " code" ,
526
+ "metadata" : {
527
+ "id" : " MlThDLCvXJwS" ,
528
+ "colab_type" : " code" ,
529
+ "colab" : {}
530
+ },
531
+ "source" : [
532
+ " logs = [[] for _ in range(NUM_RUNS)]\n " ,
719
533
" \n " ,
720
- " def train(self, num_epochs):\n " ,
721
- " \"\"\" Train the network for a specified number of epochs, and save\n " ,
722
- " the best performing model on the validation set.\n " ,
723
- " \n " ,
724
- " Args:\n " ,
725
- " num_epochs (int): number of epochs for training the network.\n " ,
726
- " Returns:\n " ,
727
- " train_loss: loss computed on the last epoch\n " ,
728
- " train_accuracy: accuracy computed on the last epoch\n " ,
729
- " val_loss: average loss on the validation set of the last epoch\n " ,
730
- " val_accuracy: accuracy on the validation set of the last epoch\n " ,
731
- " \"\"\"\n " ,
732
- " \n " ,
733
- " # @todo: is the return behaviour intended? (scores of the last epoch)\n " ,
734
- " \n " ,
735
- " self.net = self.net.to(self.device)\n " ,
736
- " if self.old_net != None:\n " ,
737
- " self.old_net = self.old_net.to(self.device)\n " ,
738
- " self.old_net.train(False)\n " ,
739
- " \n " ,
740
- " cudnn.benchmark # Calling this optimizes runtime\n " ,
741
- " \n " ,
742
- " self.best_loss = float(\" inf\" )\n " ,
743
- " self.best_epoch = 0\n " ,
744
- " \n " ,
745
- " for epoch in range(num_epochs):\n " ,
746
- " # Run an epoch (start counting form 1)\n " ,
747
- " train_loss, train_accuracy = self.do_epoch(epoch+1)\n " ,
534
+ " # Iterate over runs\n " ,
535
+ " for run_i in range(NUM_RUNS):\n " ,
536
+ " net = resnet32()\n " ,
748
537
" \n " ,
749
- " # Validate after each epoch \n " ,
750
- " val_loss, val_accuracy = self.validate() \n " ,
751
- " \n " ,
752
- " # Best validation model\n " ,
753
- " if val_loss < self.best_loss:\n " ,
754
- " self.best_loss = val_loss\n " ,
755
- " self.best_net = deepcopy(self.net)\n " ,
756
- " self.best_epoch = epoch\n " ,
757
- " print(\" Best model updated\" )\n " ,
758
- " \n " ,
759
- " print(\"\" )\n " ,
760
- " \n " ,
761
- " return (train_loss, train_accuracy,\n " ,
762
- " val_loss, val_accuracy)\n " ,
763
- " \n " ,
764
- " \n " ,
765
- " def validate(self):\n " ,
766
- " \"\"\" Validate the model.\n " ,
538
+ " criterion = nn.BCEWithLogitsLoss()\n " ,
767
539
" \n " ,
768
- " Returns:\n " ,
769
- " val_loss: average loss function computed on the network outputs\n " ,
770
- " of the validation set (val_dataloader).\n " ,
771
- " val_accuracy: accuracy computed on the validation set.\n " ,
772
- " \"\"\"\n " ,
773
- " \n " ,
774
- " self.net.train(False)\n " ,
775
- " \n " ,
776
- " running_val_loss = 0\n " ,
777
- " running_corrects = 0\n " ,
778
- " total = 0\n " ,
779
- " batch_idx = 0\n " ,
780
- " \n " ,
781
- " \n " ,
782
- " for batch, labels in self.val_dataloader:\n " ,
783
- " batch = batch.to(self.device)\n " ,
784
- " labels = labels.to(self.device)\n " ,
785
- " total += labels.size(0)\n " ,
786
- " \n " ,
787
- " # One hot encoding of new task labels \n " ,
788
- " one_hot_labels = self.to_onehot(labels) # Size = [128, 100] will be sliced as [:, :self.num_classes-10]\n " ,
789
- " new_classes = (self.order[range(self.num_classes-10, self.num_classes)]).astype(np.int32)\n " ,
790
- " one_hot_labels = torch.stack([one_hot_labels[:, i] for i in new_classes], axis=1)\n " ,
791
- " \n " ,
792
- " if self.num_classes > 10:\n " ,
793
- " # Old net forward pass\n " ,
794
- " old_outputs = self.sigmoid(self.old_net(batch)) # Size = [128, 100]\n " ,
795
- " old_classes = (self.order[range(self.num_classes-10)]).astype(np.int32)\n " ,
796
- " old_outputs = torch.stack([old_outputs[:, i] for i in old_classes], axis =1)\n " ,
797
- " \n " ,
798
- " # Combine new and old class targets\n " ,
799
- " targets = torch.cat((old_outputs, one_hot_labels), 1)\n " ,
800
- " \n " ,
801
- " else:\n " ,
802
- " targets = one_hot_labels\n " ,
803
- " \n " ,
804
- " # New net forward pass\n " ,
805
- " outputs = self.net(batch) # Size = [128, 100] comparable with the define targets\n " ,
806
- " out_classes = (self.order[range(self.num_classes)]).astype(np.int32)\n " ,
807
- " outputs = torch.stack([outputs[:, i] for i in out_classes], axis=1)\n " ,
808
- " \n " ,
809
- " \n " ,
810
- " loss = self.criterion(outputs, targets) # BCE Loss with sigmoids over outputs (over targets must be done manually)\n " ,
811
- " \n " ,
812
- " # Get predictions\n " ,
813
- " _, preds = torch.max(outputs.data, 1)\n " ,
814
- " \n " ,
815
- " # Update the number of correctly classified validation samples\n " ,
816
- " running_corrects += torch.sum(preds == labels.data).data.item()\n " ,
817
- " running_val_loss += loss.item()\n " ,
818
- " \n " ,
819
- " batch_idx += 1\n " ,
820
- " \n " ,
821
- " # Calcuate scores\n " ,
822
- " val_loss = running_val_loss / batch_idx\n " ,
823
- " val_accuracy = running_corrects / float(total)\n " ,
824
- " \n " ,
825
- " print(f\" Validation loss: {val_loss}, Validation accuracy: {val_accuracy}\" )\n " ,
826
- " \n " ,
827
- " return (val_loss, val_accuracy)\n " ,
828
- " \n " ,
829
- " \n " ,
830
- " def test(self):\n " ,
831
- " \"\"\" Test the model.\n " ,
832
- " Returns:\n " ,
833
- " accuracy (float): accuracy of the model on the test set\n " ,
834
- " \"\"\"\n " ,
835
- " \n " ,
836
- " self.best_net.train(False) # Set Network to evaluation mode\n " ,
837
- " \n " ,
838
- " running_corrects = 0\n " ,
839
- " total = 0\n " ,
540
+ " for split_i in range(10):\n " ,
541
+ " print(f\" ## Split {split_i} of run {run_i} ##\" )\n " ,
840
542
" \n " ,
841
- " all_preds = torch.tensor([]) # to store all predictions\n " ,
842
- " all_preds = all_preds.type(torch.LongTensor)\n " ,
843
- " \n " ,
844
- " for images, labels in self.test_dataloader:\n " ,
845
- " images = images.to(self.device)\n " ,
846
- " labels = labels.to(self.device)\n " ,
847
- " total += labels.size(0)\n " ,
543
+ " # Redefine optimizer at each split (pass by reference issue)\n " ,
544
+ " parameters_to_optimize = net.parameters()\n " ,
545
+ " optimizer = optim.SGD(parameters_to_optimize, lr=LR,\n " ,
546
+ " momentum=MOMENTUM, weight_decay=WEIGHT_DECAY)\n " ,
547
+ " scheduler = optim.lr_scheduler.MultiStepLR(optimizer, \n " ,
548
+ " milestones=MILESTONES, gamma=GAMMA)\n " ,
549
+ " \n " ,
550
+ " num_classes = 10*(split_i+1)\n " ,
551
+ " \n " ,
552
+ " if num_classes == 10: # old network == None\n " ,
553
+ " lwf = LWF(DEVICE, net, None, criterion, optimizer, scheduler,\n " ,
554
+ " train_dataloaders[run_i][split_i],\n " ,
555
+ " val_dataloaders[run_i][split_i],\n " ,
556
+ " test_dataloaders[run_i][split_i],\n " ,
557
+ " num_classes)\n " ,
558
+ " else:\n " ,
559
+ " lwf = LWF(DEVICE, net, old_net, criterion, optimizer, scheduler,\n " ,
560
+ " train_dataloaders[run_i][split_i],\n " ,
561
+ " val_dataloaders[run_i][split_i],\n " ,
562
+ " test_dataloaders[run_i][split_i],\n " ,
563
+ " num_classes)\n " ,
848
564
" \n " ,
849
- " # Forward Pass\n " ,
850
- " outputs = self.best_net(images)\n " ,
565
+ " scores = lwf.train(NUM_EPOCHS) # train the model\n " ,
851
566
" \n " ,
852
- " # Get predictions\n " ,
853
- " _, preds = torch.max(outputs.data, 1)\n " ,
567
+ " logs[run_i].append({})\n " ,
854
568
" \n " ,
855
- " # Update Corrects\n " ,
856
- " running_corrects += torch.sum(preds == labels.data).data.item()\n " ,
569
+ " # score[i] = dictionary with key:epoch, value: score\n " ,
570
+ " logs[run_i][split_i]['train_loss'] = scores[0]\n " ,
571
+ " logs[run_i][split_i]['train_accuracy'] = scores[1]\n " ,
572
+ " logs[run_i][split_i]['val_loss'] = scores[2]\n " ,
573
+ " logs[run_i][split_i]['val_accuracy'] = scores[3]\n " ,
857
574
" \n " ,
858
- " # Append batch predictions\n " ,
859
- " all_preds = torch.cat(\n " ,
860
- " (all_preds.to(self.device), preds.to(self.device)), dim=0\n " ,
861
- " )\n " ,
575
+ " # Test the model on classes seen until now\n " ,
576
+ " test_accuracy, all_targets, all_preds = lwf.test()\n " ,
862
577
" \n " ,
863
- " # Calculate accuracy \n " ,
864
- " accuracy = running_corrects / float(total) \n " ,
578
+ " logs[run_i][split_i]['test_accuracy'] = test_accuracy \n " ,
579
+ " logs[run_i][split_i]['conf_mat'] = confusion_matrix(all_targets.to('cpu'), all_preds.to('cpu')) \n " ,
865
580
" \n " ,
866
- " print(f \" Test accuracy: {accuracy} \" )\n " ,
581
+ " old_net = deepcopy(lwf.net )\n " ,
867
582
" \n " ,
868
- " return (accuracy, all_preds )"
583
+ " lwf.increment_classes( )"
869
584
],
870
585
"execution_count" : null ,
871
586
"outputs" : []
872
587
},
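The heart of the removed `LWF.do_batch` (now refactored into `model/lwf.py`) is how it builds the BCE targets: the frozen old network's sigmoid outputs serve as soft targets for the previously seen classes, concatenated with one-hot labels for the 10 new ones. Since `self.order` was `np.arange(100)` (the identity), the per-column gathering reduces to plain slicing. A condensed sketch (`torch.no_grad()` is added here for clarity; the original relied on `old_net.train(False)`):

```python
import torch
import torch.nn as nn

criterion = nn.BCEWithLogitsLoss()

def lwf_batch_loss(net, old_net, batch, one_hot_labels, num_classes):
    """LwF loss: distillation on old classes + classification on new ones."""
    outputs = net(batch)[:, :num_classes]
    with torch.no_grad():
        # Soft targets from the previous model for the already-seen classes
        old_outputs = torch.sigmoid(old_net(batch))[:, :num_classes - 10]
    new_targets = one_hot_labels[:, num_classes - 10:num_classes]
    targets = torch.cat((old_outputs, new_targets), dim=1)
    return criterion(outputs, targets)
```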
588
+ {
589
+ "cell_type" : " markdown" ,
590
+ "metadata" : {
591
+ "id" : " 2xZbK6EGSaZN" ,
592
+ "colab_type" : " text"
593
+ },
594
+ "source" : [
595
+ " ### Plots"
596
+ ]
597
+ },
873
598
{
874
599
"cell_type" : " code" ,
875
600
"metadata" : {
876
- "id" : " MlThDLCvXJwS " ,
601
+ "id" : " bUfgSq1xSbrD " ,
877
602
"colab_type" : " code" ,
878
603
"colab" : {}
879
604
},
880
605
"source" : [
881
- " train_loss_history = []\n " ,
882
- " train_accuracy_history = []\n " ,
883
- " val_loss_history = []\n " ,
884
- " val_accuracy_history = []\n " ,
885
- " test_accuracy_history = []\n " ,
886
- " \n " ,
887
- " \n " ,
888
- " \n " ,
889
- " # Iterate over runs\n " ,
890
- " for train_dataloader, val_dataloader, test_dataloader in zip(train_dataloaders,\n " ,
891
- " val_dataloaders, test_dataloaders):\n " ,
892
- " \n " ,
893
- " \n " ,
894
- " train_loss_history.append({})\n " ,
895
- " train_accuracy_history.append({})\n " ,
896
- " val_loss_history.append({})\n " ,
897
- " val_accuracy_history.append({})\n " ,
898
- " test_accuracy_history.append({})\n " ,
899
- " \n " ,
900
- " net = resnet32() # Define the net\n " ,
901
- " \n " ,
902
- " criterion = nn.BCEWithLogitsLoss() # Define the loss\n " ,
903
- " \n " ,
904
- " \n " ,
905
- " i = 0\n " ,
906
- " for train_split, val_split, test_split in zip(train_dataloader,\n " ,
907
- " val_dataloader, test_dataloader):\n " ,
908
- " \n " ,
909
- " # Redefine optimizer at each split (pass by reference issue)\n " ,
910
- " parameters_to_optimize = net.parameters()\n " ,
911
- " optimizer = optim.SGD(parameters_to_optimize, lr=LR,\n " ,
912
- " momentum=MOMENTUM, weight_decay=WEIGHT_DECAY)\n " ,
913
- " scheduler = optim.lr_scheduler.MultiStepLR(optimizer, \n " ,
914
- " milestones=MILESTONES, gamma=GAMMA)\n " ,
915
- " \n " ,
916
- " current_split = \" Split %i\" %(i)\n " ,
917
- " print(current_split)\n " ,
918
- " \n " ,
919
- " num_classes = CLASS_BATCH_SIZE*(i+1)\n " ,
920
- " \n " ,
921
- " if num_classes == CLASS_BATCH_SIZE:\n " ,
922
- " # Old Network = None\n " ,
923
- " lwf = LWF(DEVICE, net, None, criterion, optimizer, scheduler,\n " ,
924
- " train_split, val_split, test_split, num_classes)\n " ,
925
- " else:\n " ,
926
- " lwf = LWF(DEVICE, net, old_net, criterion, optimizer, scheduler,\n " ,
927
- " train_split, val_split, test_split, num_classes)\n " ,
928
- " \n " ,
929
- " \n " ,
930
- " scores = lwf.train(NUM_EPOCHS) # train the model\n " ,
931
- " \n " ,
932
- " # score[i] = dictionary with key:epoch, value: score\n " ,
933
- " train_loss_history[-1][current_split] = scores[0]\n " ,
934
- " train_accuracy_history[-1][current_split] = scores[1]\n " ,
935
- " val_loss_history[-1][current_split] = scores[2]\n " ,
936
- " val_accuracy_history[-1][current_split] = scores[3]\n " ,
937
- " \n " ,
938
- " # Test the model on classes seen until now\n " ,
939
- " test_accuracy, all_preds = lwf.test()\n " ,
940
- " \n " ,
941
- " test_accuracy_history[-1][current_split] = test_accuracy\n " ,
606
+ " train_loss = [[logs[run_i][i]['train_loss'] for i in range(10)] for run_i in range(NUM_RUNS)]\n " ,
607
+ " train_accuracy = [[logs[run_i][i]['train_accuracy'] for i in range(10)] for run_i in range(NUM_RUNS)]\n " ,
608
+ " val_loss = [[logs[run_i][i]['val_loss'] for i in range(10)] for run_i in range(NUM_RUNS)]\n " ,
609
+ " val_accuracy = [[logs[run_i][i]['val_accuracy'] for i in range(10)] for run_i in range(NUM_RUNS)]\n " ,
610
+ " test_accuracy = [[logs[run_i][i]['test_accuracy'] for i in range(10)] for run_i in range(NUM_RUNS)]\n " ,
942
611
" \n " ,
943
- " # Uncomment if default resnet has 10 node at last FC layer\n " ,
944
- " old_net = deepcopy(lwf.net)\n " ,
945
- " lwf.increment_classes()\n " ,
612
+ " train_loss = np.array(train_loss)\n " ,
613
+ " train_accuracy = np.array(train_accuracy)\n " ,
614
+ " val_loss = np.array(val_loss)\n " ,
615
+ " val_accuracy = np.array(val_accuracy)\n " ,
616
+ " test_accuracy = np.array(test_accuracy)\n " ,
946
617
" \n " ,
947
- " i =i+1"
618
+ " train_loss_stats = np.array([train_loss.mean(0), train_loss.std(0)]).transpose()\n " ,
619
+ " train_accuracy_stats = np.array([train_accuracy.mean(0), train_accuracy.std(0)]).transpose()\n " ,
620
+ " val_loss_stats = np.array([val_loss.mean(0), val_loss.std(0)]).transpose()\n " ,
621
+ " val_accuracy_stats = np.array([val_accuracy.mean(0), val_accuracy.std(0)]).transpose()\n " ,
622
+ " test_accuracy_stats = np.array([test_accuracy.mean(0), test_accuracy.std(0)]).transpose()"
623
+ ],
624
+ "execution_count" : null ,
625
+ "outputs" : []
626
+ },
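`plot.train_val_scores` and `plot.test_scores` come from `utils/plot.py` and are not part of this diff. Given the `(mean, std)` pairs per split built above, `plot.test_scores` presumably draws something like the following (illustrative sketch):

```python
import matplotlib.pyplot as plt
import numpy as np

def test_scores(stats):
    """Plot mean test accuracy per split with std error bars across runs."""
    classes_seen = np.arange(10, 101, 10)   # 10, 20, ..., 100 classes
    mean, std = stats[:, 0], stats[:, 1]
    plt.errorbar(classes_seen, mean, yerr=std, marker='o', capsize=3)
    plt.xlabel('Number of classes seen')
    plt.ylabel('Test accuracy')
    plt.show()
```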
627
+ {
628
+ "cell_type" : " code" ,
629
+ "metadata" : {
630
+ "colab_type" : " code" ,
631
+ "id" : " 1w3_YPJCSeli" ,
632
+ "colab" : {}
633
+ },
634
+ "source" : [
635
+ " plot.train_val_scores(train_loss_stats, train_accuracy_stats, val_loss_stats, val_accuracy_stats)"
636
+ ],
637
+ "execution_count" : null ,
638
+ "outputs" : []
639
+ },
640
+ {
641
+ "cell_type" : " code" ,
642
+ "metadata" : {
643
+ "colab_type" : " code" ,
644
+ "id" : " ZSt6-FJbSelp" ,
645
+ "colab" : {}
646
+ },
647
+ "source" : [
648
+ " plot.test_scores(test_accuracy_stats)"
948
649
],
949
650
"execution_count" : null ,
950
651
"outputs" : []
1108
809
"execution_count" : null ,
1109
810
"outputs" : []
1110
811
},
1111
- {
1112
- "cell_type" : " code" ,
1113
- "metadata" : {
1114
- "id" : " by8c4Aaa-8ms" ,
1115
- "colab_type" : " code" ,
1116
- "colab" : {}
1117
- },
1118
- "source" : [
1119
- " print(logs_icarl)"
1120
- ],
1121
- "execution_count" : null ,
1122
- "outputs" : []
1123
- },
1124
- {
1125
- "cell_type" : " code" ,
1126
- "metadata" : {
1127
- "id" : " qOCjSFJy_ANm" ,
1128
- "colab_type" : " code" ,
1129
- "colab" : {}
1130
- },
1131
- "source" : [
1132
- " obj_save(logs_icarl, 'hybrid1_confmat')"
1133
- ],
1134
- "execution_count" : null ,
1135
- "outputs" : []
1136
- },
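The removed cells persist the iCaRL logs through `obj_save`, a utility not shown in the diff; a pickle-based implementation along these lines would match the call site (an assumption):

```python
import pickle

def obj_save(obj, name):
    """Serialize obj to <name>.pkl in the working directory."""
    with open(f'{name}.pkl', 'wb') as f:
        pickle.dump(obj, f)
```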
1137
812
{
1138
813
"cell_type" : " markdown" ,
1139
814
"metadata" : {
1200
875
"outputs" : []
1201
876
}
1202
877
]
1203
- }
878
+ }