From e8a70c0f1e30e8af70ebee373fe077500c190287 Mon Sep 17 00:00:00 2001 From: Ben Akka Zakariae <zakariae.ben-akka@etu.ec-lyon.fr> Date: Thu, 23 Nov 2023 11:17:53 +0000 Subject: [PATCH] Upload New File --- TD2_Deep_Learning.ipynb | 993 ++++++++++++++++++++++++++++++++++++++++ 1 file changed, 993 insertions(+) create mode 100644 TD2_Deep_Learning.ipynb diff --git a/TD2_Deep_Learning.ipynb b/TD2_Deep_Learning.ipynb new file mode 100644 index 0000000..fd619c2 --- /dev/null +++ b/TD2_Deep_Learning.ipynb @@ -0,0 +1,993 @@ +{ + "cells": [ + { + "cell_type": "markdown", + "id": "7edf7168", + "metadata": {}, + "source": [ + "# TD2: Deep learning" + ] + }, + { + "cell_type": "markdown", + "id": "fbb8c8df", + "metadata": {}, + "source": [ + "In this TD, you must modify this notebook to answer the questions. To do this,\n", + "\n", + "1. Fork this repository\n", + "2. Clone your forked repository on your local computer\n", + "3. Answer the questions\n", + "4. Commit and push regularly\n", + "\n", + "The last commit is due on Sunday, December 1, 11:59 PM. Later commits will not be taken into account." + ] + }, + { + "cell_type": "markdown", + "id": "3d167a29", + "metadata": {}, + "source": [ + "Install and test PyTorch from https://pytorch.org/get-started/locally." 
+ ] + }, + { + "cell_type": "code", + "execution_count": 4, + "id": "330a42f5", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "Requirement already satisfied: torch in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (2.1.0+cu118)\n", + "Requirement already satisfied: torchvision in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (0.16.0+cu118)\n", + "Requirement already satisfied: filelock in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torch) (3.9.0)\n", + "Requirement already satisfied: typing-extensions in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torch) (4.4.0)\n", + "Requirement already satisfied: sympy in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torch) (1.12)\n", + "Requirement already satisfied: networkx in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torch) (3.0)\n", + "Requirement already satisfied: jinja2 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torch) (3.1.2)\n", + "Requirement already satisfied: fsspec in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torch) (2023.4.0)\n", + "Requirement already satisfied: numpy in 
c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torchvision) (1.26.1)\n", + "Requirement already satisfied: requests in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torchvision) (2.31.0)\n", + "Requirement already satisfied: pillow!=8.3.*,>=5.3.0 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from torchvision) (10.1.0)\n", + "Requirement already satisfied: MarkupSafe>=2.0 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from jinja2->torch) (2.1.2)\n", + "Requirement already satisfied: charset-normalizer<4,>=2 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from requests->torchvision) (3.3.1)\n", + "Requirement already satisfied: idna<4,>=2.5 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from requests->torchvision) (3.4)\n", + "Requirement already satisfied: urllib3<3,>=1.21.1 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from requests->torchvision) (2.0.7)\n", + "Requirement already satisfied: certifi>=2017.4.17 in c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from requests->torchvision) (2023.7.22)\n", + "Requirement already satisfied: mpmath>=0.19 in 
c:\\users\\lenovo\\appdata\\local\\packages\\pythonsoftwarefoundation.python.3.11_qbz5n2kfra8p0\\localcache\\local-packages\\python311\\site-packages (from sympy->torch) (1.3.0)\n", + "Note: you may need to restart the kernel to use updated packages.\n" + ] + } + ], + "source": [ + "%pip install torch torchvision" + ] + }, + { + "cell_type": "markdown", + "id": "0882a636", + "metadata": {}, + "source": [ + "\n", + "To test run the following code" + ] + }, + { + "cell_type": "code", + "execution_count": 5, + "id": "b1950f0a", + "metadata": {}, + "outputs": [ + { + "name": "stdout", + "output_type": "stream", + "text": [ + "tensor([[ 1.0605, 0.4877, 1.3848, -0.5006, 0.0414, 0.2985, 0.1982, 0.5928,\n", + " 0.4444, 0.3458],\n", + " [-0.1176, -1.5951, -1.1404, 0.6262, -1.0974, -0.7637, 0.4559, 0.3599,\n", + " 0.7854, 0.1764],\n", + " [ 0.2529, 0.4114, 1.5469, 0.2975, -0.9362, -1.0877, 0.3287, 1.8137,\n", + " 0.9959, -0.9416],\n", + " [ 0.8527, -1.1763, 1.0453, 0.2173, 1.2337, -0.4122, -0.4660, 0.5123,\n", + " -0.5657, 0.2373],\n", + " [-0.5439, 0.9611, 0.8822, -1.0495, -0.8781, -0.9642, -0.9343, 0.6947,\n", + " -0.1654, -0.6049],\n", + " [-1.2154, 1.4457, 0.5532, 0.5507, 0.9646, 1.6836, -0.7217, -1.5023,\n", + " -0.1566, -0.0864],\n", + " [ 2.1407, 0.1364, 0.5218, 0.5398, 0.8079, 1.3318, 0.1576, 0.7597,\n", + " 1.8427, -0.1918],\n", + " [-0.4011, -2.5381, 0.6992, -0.8056, 0.1494, -0.8711, -1.0129, 0.4020,\n", + " 0.1074, 1.4686],\n", + " [-0.1769, 1.0718, 0.6540, -1.6458, 2.1758, 0.0703, 0.7089, 0.9214,\n", + " 1.4192, -0.5498],\n", + " [-1.4553, -0.0320, 0.4980, -0.9733, 0.4106, -0.4363, 1.5308, -0.8421,\n", + " 0.0412, -2.0390],\n", + " [ 0.1056, 0.6472, -0.1967, 0.9547, 0.8193, -1.4786, -0.5792, -0.1598,\n", + " -0.1151, 0.0905],\n", + " [ 0.6584, -2.2935, 0.0100, -1.8383, 2.2067, -0.1495, 0.0839, 2.0443,\n", + " -1.7859, -0.5420],\n", + " [ 0.4898, -0.1235, 0.4655, -0.9289, -0.8926, -2.5259, 0.4773, -0.2087,\n", + " 2.2034, 0.1863],\n", + " [-1.3225, 0.4705, 
# %% Sanity check: confirm that PyTorch and torchvision import and run
import torch
from torchvision import models

# Draw a small random float matrix to confirm tensor creation works.
N, D = 14, 10
x = torch.randn(N, D).float()
print(x)

# Build an untrained AlexNet and print its layer structure.
alexnet = models.alexnet()
print(alexnet)
# %% Imports and reproducibility
import numpy as np
import torch
import torch.nn as nn
import torch.nn.functional as F
from torch.utils.data.sampler import SubsetRandomSampler
from torchvision import datasets, transforms

# Seed every source of randomness used below (validation split, sampler order,
# weight initialisation) so that Restart & Run All reproduces the same numbers.
SEED = 42
torch.manual_seed(SEED)
rng = np.random.default_rng(SEED)

# %% Check whether a CUDA device is available
# Later cells read this flag to decide whether to move the model and batches
# to the GPU.
train_on_gpu = torch.cuda.is_available()

if not train_on_gpu:
    print("CUDA is not available. Training on CPU ...")
else:
    print("CUDA is available! Training on GPU ...")

# %% Load the CIFAR10 dataset
# number of subprocesses to use for data loading
num_workers = 0
# how many samples per batch to load
batch_size = 20
# fraction of the training set held out for validation
valid_size = 0.2

# convert images to tensors and rescale each channel with mean 0.5 / std 0.5
transform = transforms.Compose(
    [transforms.ToTensor(), transforms.Normalize((0.5, 0.5, 0.5), (0.5, 0.5, 0.5))]
)

# choose the training and test datasets
train_data = datasets.CIFAR10("data", train=True, download=True, transform=transform)
test_data = datasets.CIFAR10("data", train=False, download=True, transform=transform)

# shuffle the training indices (seeded) and carve off the validation subset
num_train = len(train_data)
indices = list(range(num_train))
rng.shuffle(indices)
split = int(np.floor(valid_size * num_train))
train_idx, valid_idx = indices[split:], indices[:split]

# samplers that draw only from their own subset of the training set
train_sampler = SubsetRandomSampler(train_idx)
valid_sampler = SubsetRandomSampler(valid_idx)

# data loaders; the validation loader reads from train_data through valid_sampler
train_loader = torch.utils.data.DataLoader(
    train_data, batch_size=batch_size, sampler=train_sampler, num_workers=num_workers
)
valid_loader = torch.utils.data.DataLoader(
    train_data, batch_size=batch_size, sampler=valid_sampler, num_workers=num_workers
)
test_loader = torch.utils.data.DataLoader(
    test_data, batch_size=batch_size, num_workers=num_workers
)

# class names, indexed by label id
classes = [
    "airplane",
    "automobile",
    "bird",
    "cat",
    "deer",
    "dog",
    "frog",
    "horse",
    "ship",
    "truck",
]


# %% CNN definition (example network)
class Net(nn.Module):
    """Small CNN: two 5x5 convolutions with 2x2 max-pooling, then three linear layers.

    The first linear layer expects 16 * 5 * 5 features, which is what the two
    conv/pool stages produce for a 3x32x32 input (32 -> 28 -> 14 -> 10 -> 5).
    """

    def __init__(self):
        super().__init__()
        self.conv1 = nn.Conv2d(3, 6, 5)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(6, 16, 5)
        self.fc1 = nn.Linear(16 * 5 * 5, 120)
        self.fc2 = nn.Linear(120, 84)
        self.fc3 = nn.Linear(84, 10)

    def forward(self, x):
        """Return the raw class scores (logits), one row of 10 per input image."""
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        # Flatten everything except the batch dimension. Unlike view(-1, 400),
        # this never folds a wrongly sized input into extra batch rows; the
        # mismatch surfaces as an error in fc1 instead.
        x = torch.flatten(x, 1)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        return self.fc3(x)


# %% Instantiate the network
model = Net()
print(model)
# move the parameters to the GPU if CUDA is available
if train_on_gpu:
    model.cuda()
# %% Loss function and training with the SGD optimizer
import matplotlib.pyplot as plt
import torch.optim as optim

criterion = nn.CrossEntropyLoss()  # loss function
optimizer = optim.SGD(model.parameters(), lr=0.01)  # optimizer

n_epochs = 30  # number of epochs to train the model
train_loss_list = []  # per-epoch training loss, for plotting
valid_loss_list = []  # per-epoch validation loss, for plotting
valid_loss_min = np.inf  # best validation loss seen so far (np.Inf is gone in NumPy 2)

for epoch in range(n_epochs):
    # running sums of per-sample losses for this epoch
    train_loss = 0.0
    valid_loss = 0.0

    # ---- training pass ----
    model.train()
    for data, target in train_loader:
        if train_on_gpu:
            data, target = data.cuda(), target.cuda()
        optimizer.zero_grad()
        output = model(data)
        loss = criterion(output, target)
        loss.backward()
        optimizer.step()
        # criterion returns the batch mean; weight it by the batch size so the
        # running sum is a sum over samples
        train_loss += loss.item() * data.size(0)

    # ---- validation pass (no gradients needed) ----
    model.eval()
    with torch.no_grad():
        for data, target in valid_loader:
            if train_on_gpu:
                data, target = data.cuda(), target.cuda()
            output = model(data)
            loss = criterion(output, target)
            valid_loss += loss.item() * data.size(0)

    # The sums are over samples, so divide by the number of samples each loader
    # draws. Dividing by len(loader) (the number of batches) would inflate the
    # reported loss by the batch size.
    train_loss = train_loss / len(train_loader.sampler)
    valid_loss = valid_loss / len(valid_loader.sampler)
    train_loss_list.append(train_loss)
    valid_loss_list.append(valid_loss)

    print(
        "Epoch: {} \tTraining Loss: {:.6f} \tValidation Loss: {:.6f}".format(
            epoch, train_loss, valid_loss
        )
    )

    # Checkpoint whenever the validation loss improves; reloading this file
    # afterwards gives the weights from the best validation epoch.
    if valid_loss <= valid_loss_min:
        print(
            "Validation loss decreased ({:.6f} --> {:.6f}). Saving model ...".format(
                valid_loss_min, valid_loss
            )
        )
        torch.save(model.state_dict(), "model_cifar.pt")
        valid_loss_min = valid_loss

# %% Does overfitting occur? Plot training and validation loss together
fig, ax = plt.subplots()
ax.plot(range(len(train_loss_list)), train_loss_list, label="Training")
ax.plot(range(len(valid_loss_list)), valid_loss_list, label="Validation")
ax.set(xlabel="Epoch", ylabel="Loss", title="Performance of Model 1")
ax.legend()
plt.show()

# %% Reload the checkpoint with the lowest validation loss and evaluate on the test set
model.load_state_dict(torch.load("./model_cifar.pt"))

test_loss = 0.0
class_correct = [0.0] * 10
class_total = [0.0] * 10

model.eval()
with torch.no_grad():
    for data, target in test_loader:
        if train_on_gpu:
            data, target = data.cuda(), target.cuda()
        output = model(data)
        loss = criterion(output, target)
        test_loss += loss.item() * data.size(0)
        # predicted class = index of the largest logit
        _, pred = torch.max(output, 1)
        correct = pred.eq(target.view_as(pred))
        # Iterate over the samples actually present in this batch, so a short
        # (or single-element) final batch is handled correctly.
        for label, hit in zip(target.tolist(), correct.tolist()):
            class_correct[label] += float(hit)
            class_total[label] += 1

# average per-sample test loss
test_loss = test_loss / len(test_loader.sampler)
print("Test Loss: {:.6f}\n".format(test_loss))

for i in range(10):
    if class_total[i] > 0:
        print(
            "Test Accuracy of %5s: %2d%% (%2d/%2d)"
            % (
                classes[i],
                100 * class_correct[i] / class_total[i],
                class_correct[i],
                class_total[i],
            )
        )
    else:
        print("Test Accuracy of %5s: N/A (no test examples)" % (classes[i]))

print(
    "\nTest Accuracy (Overall): %2d%% (%2d/%2d)"
    % (
        100.0 * np.sum(class_correct) / np.sum(class_total),
        np.sum(class_correct),
        np.sum(class_total),
    )
)
# %% Second network
import torch
import torch.nn as nn
import torch.nn.functional as F


class Second_Net(nn.Module):
    """CNN with three 3x3 convolutions (padding 1) and three linear layers.

    Each convolution keeps the spatial size, since (H + 2*1 - 3)/1 + 1 = H, and
    is followed by ReLU and a 2x2 max-pool that halves it. For a 3x32x32 input
    the feature maps are:

        conv1: 16 x 32 x 32  -> pool: 16 x 16 x 16
        conv2: 32 x 16 x 16  -> pool: 32 x  8 x  8
        conv3: 64 x  8 x  8  -> pool: 64 x  4 x  4

    so the first linear layer receives 64 * 4 * 4 = 1024 features.
    """

    def __init__(self):
        super().__init__()
        self.conv1 = nn.Conv2d(3, 16, 3, padding=1)
        self.pool = nn.MaxPool2d(2, 2)
        self.conv2 = nn.Conv2d(16, 32, 3, padding=1)
        self.conv3 = nn.Conv2d(32, 64, 3, padding=1)
        self.fc1 = nn.Linear(64 * 4 * 4, 512)
        self.fc2 = nn.Linear(512, 64)
        self.fc3 = nn.Linear(64, 10)

    def forward(self, x):
        """Return the raw class scores (logits), one row of 10 per input image."""
        x = self.pool(F.relu(self.conv1(x)))
        x = self.pool(F.relu(self.conv2(x)))
        x = self.pool(F.relu(self.conv3(x)))
        # Flatten everything except the batch dimension. view(-1, 1024) would
        # silently turn a wrongly sized input into extra batch rows; with
        # flatten the mismatch raises in fc1 instead.
        x = torch.flatten(x, 1)
        x = F.relu(self.fc1(x))
        x = F.relu(self.fc2(x))
        return self.fc3(x)


# Build an instance only to display the architecture; the training cell
# constructs its own fresh Second_Net.
model = Second_Net()
print(model)
# %% Train the second model
import matplotlib.pyplot as plt
import torch.optim as optim

model = Second_Net()
# Batches are moved to the GPU below when train_on_gpu is set, so the model
# must live on the same device or the first forward pass fails.
if train_on_gpu:
    model.cuda()

criterion = nn.CrossEntropyLoss()  # loss function
optimizer = optim.SGD(model.parameters(), lr=0.01)  # optimizer

n_epochs = 30  # number of epochs to train the model
train_loss_list = []  # per-epoch training loss, for plotting
valid_loss_list = []  # per-epoch validation loss, for plotting
valid_loss_min = np.inf  # best validation loss seen so far (np.Inf is gone in NumPy 2)

for epoch in range(n_epochs):
    # running sums of per-sample losses for this epoch
    train_loss = 0.0
    valid_loss = 0.0

    # ---- training pass ----
    model.train()
    for data, target in train_loader:
        if train_on_gpu:
            data, target = data.cuda(), target.cuda()
        optimizer.zero_grad()
        output = model(data)
        loss = criterion(output, target)
        loss.backward()
        optimizer.step()
        # criterion returns the batch mean; weight it by the batch size so the
        # running sum is a sum over samples
        train_loss += loss.item() * data.size(0)

    # ---- validation pass (no gradients needed) ----
    model.eval()
    with torch.no_grad():
        for data, target in valid_loader:
            if train_on_gpu:
                data, target = data.cuda(), target.cuda()
            output = model(data)
            loss = criterion(output, target)
            valid_loss += loss.item() * data.size(0)

    # The sums are over samples, so divide by the number of samples each loader
    # draws. Dividing by len(loader) (the number of batches) would inflate the
    # reported loss by the batch size.
    train_loss = train_loss / len(train_loader.sampler)
    valid_loss = valid_loss / len(valid_loader.sampler)
    train_loss_list.append(train_loss)
    valid_loss_list.append(valid_loss)

    print(
        "Epoch: {} \tTraining Loss: {:.6f} \tValidation Loss: {:.6f}".format(
            epoch, train_loss, valid_loss
        )
    )

    # Checkpoint whenever the validation loss improves; reloading this file
    # afterwards gives the weights from the best validation epoch.
    if valid_loss <= valid_loss_min:
        print(
            "Validation loss decreased ({:.6f} --> {:.6f}). Saving model ...".format(
                valid_loss_min, valid_loss
            )
        )
        torch.save(model.state_dict(), "new_model_cifar.pt")
        valid_loss_min = valid_loss

# %% Reload the second model's best checkpoint and evaluate on the test set
model.load_state_dict(torch.load("./new_model_cifar.pt"))

test_loss = 0.0
class_correct = [0.0] * 10
class_total = [0.0] * 10

model.eval()
with torch.no_grad():
    for data, target in test_loader:
        if train_on_gpu:
            data, target = data.cuda(), target.cuda()
        output = model(data)
        loss = criterion(output, target)
        test_loss += loss.item() * data.size(0)
        # predicted class = index of the largest logit
        _, pred = torch.max(output, 1)
        correct = pred.eq(target.view_as(pred))
        # Iterate over the samples actually present in this batch, so a short
        # (or single-element) final batch is handled correctly.
        for label, hit in zip(target.tolist(), correct.tolist()):
            class_correct[label] += float(hit)
            class_total[label] += 1

# average per-sample test loss
test_loss = test_loss / len(test_loader.sampler)
print("Test Loss: {:.6f}\n".format(test_loss))

for i in range(10):
    if class_total[i] > 0:
        print(
            "Test Accuracy of %5s: %2d%% (%2d/%2d)"
            % (
                classes[i],
                100 * class_correct[i] / class_total[i],
                class_correct[i],
                class_total[i],
            )
        )
    else:
        print("Test Accuracy of %5s: N/A (no test examples)" % (classes[i]))

print(
    "\nTest Accuracy (Overall): %2d%% (%2d/%2d)"
    % (
        100.0 * np.sum(class_correct) / np.sum(class_total),
        np.sum(class_correct),
        np.sum(class_total),
    )
)

# %% Plot the loss as a function of the epoch for the second model
fig, ax = plt.subplots()
ax.plot(range(len(train_loss_list)), train_loss_list, label="Training")
ax.plot(range(len(valid_loss_list)), valid_loss_list, label="Validation")
ax.set(xlabel="Epoch", ylabel="Loss", title="Performance of Model 2")
ax.legend()
plt.show()
The first convolutional layer must output 16 channels, the second 32 and the third 64.\n", + "- At each convolutional layer output, we apply a ReLU activation then a MaxPool with kernel size of 2.\n", + "- Then, three fully connected layers, the first two being followed by a ReLU activation and a dropout whose value you will suggest.\n", + "- The first fully connected layer will have an output size of 512.\n", + "- The second fully connected layer will have an output size of 64.\n", + "\n", + "Compare the results obtained with this new network to those obtained previously." + ] + } + ], + "metadata": { + "kernelspec": { + "display_name": "Python 3.8.5 ('base')", + "language": "python", + "name": "python3" + }, + "language_info": { + "codemirror_mode": { + "name": "ipython", + "version": 3 + }, + "file_extension": ".py", + "mimetype": "text/x-python", + "name": "python", + "nbconvert_exporter": "python", + "pygments_lexer": "ipython3", + "version": "3.11.6" + }, + "vscode": { + "interpreter": { + "hash": "9e3efbebb05da2d4a1968abe9a0645745f54b63feb7a85a514e4da0495be97eb" + } + } + }, + "nbformat": 4, + "nbformat_minor": 5 +} -- GitLab