Created using Colaboratory

tinhb92 · tinhb92 · commit 67639a041bdd · 2019-10-11T21:59:44.000+08:00
diff --git a/deep_learning/lstm.ipynb b/deep_learning/lstm.ipynb
@@ -0,0 +1,244 @@
+{
+  "nbformat": 4,
+  "nbformat_minor": 0,
+  "metadata": {
+    "colab": {
+      "name": "lstm",
+      "provenance": [],
+      "include_colab_link": true
+    },
+    "kernelspec": {
+      "name": "python3",
+      "display_name": "Python 3"
+    }
+  },
+  "cells": [
+    {
+      "cell_type": "markdown",
+      "metadata": {
+        "id": "view-in-github",
+        "colab_type": "text"
+      },
+      "source": [
+        "<a href=\"https://colab.research.google.com/github/tinhb92/relax_ml/blob/master/deep_learning/lstm.ipynb\" target=\"_parent\"><img src=\"https://colab.research.google.com/assets/colab-badge.svg\" alt=\"Open In Colab\"/></a>"
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "414DjyHwHBH7",
+        "colab_type": "code",
+        "colab": {}
+      },
+      "source": [
+        "import torch \n",
+        "import torch.nn as nn\n",
+        "import torchvision\n",
+        "import torchvision.transforms as transforms\n",
+        "\n",
+        "# Device configuration: use the GPU when one is visible, otherwise fall back to the CPU\n",
+        "device = torch.device('cuda' if torch.cuda.is_available() else 'cpu')\n",
+        "\n",
+        "# Seed PyTorch's global RNG so that weight initialisation and batch shuffling\n",
+        "# repeat from run to run (GPU kernels may still add small nondeterminism)\n",
+        "seed = 0\n",
+        "torch.manual_seed(seed)\n",
+        "\n",
+        "# Hyper-parameters\n",
+        "sequence_length = 28   # time steps per sample (images are reshaped to sequence_length x input_size)\n",
+        "input_size = 28        # features fed to the LSTM at each time step\n",
+        "hidden_size = 128      # width of the LSTM hidden state\n",
+        "num_layers = 2         # number of stacked LSTM layers\n",
+        "num_classes = 10       # size of the classifier output\n",
+        "batch_size = 100       # samples per mini-batch for both loaders\n",
+        "num_epochs = 2         # full passes over the training set\n",
+        "learning_rate = 0.01   # step size handed to the optimizer"
+      ],
+      "execution_count": 0,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "e2NCj8qbGI2r",
+        "colab_type": "code",
+        "colab": {}
+      },
+      "source": [
+        "# MNIST dataset: both splits live under the same root and share one transform\n",
+        "data_root = '../../data/'\n",
+        "to_tensor = transforms.ToTensor()\n",
+        "\n",
+        "# Training split, fetched on demand\n",
+        "train_dataset = torchvision.datasets.MNIST(\n",
+        "    root=data_root, train=True, transform=to_tensor, download=True)\n",
+        "\n",
+        "# Test split, read from the same root (no download flag, as before)\n",
+        "test_dataset = torchvision.datasets.MNIST(\n",
+        "    root=data_root, train=False, transform=to_tensor)\n",
+        "\n",
+        "# Data loaders: shuffle the training batches, keep the test order fixed\n",
+        "train_loader = torch.utils.data.DataLoader(\n",
+        "    dataset=train_dataset, batch_size=batch_size, shuffle=True)\n",
+        "\n",
+        "test_loader = torch.utils.data.DataLoader(\n",
+        "    dataset=test_dataset, batch_size=batch_size, shuffle=False)"
+      ],
+      "execution_count": 0,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "o55sVKwpGMLx",
+        "colab_type": "code",
+        "colab": {}
+      },
+      "source": [
+        "# Recurrent neural network (many-to-one)\n",
+        "class RNN(nn.Module):\n",
+        "    \"\"\"Stacked LSTM followed by a linear layer applied to the last time step.\n",
+        "\n",
+        "    Args:\n",
+        "        input_size: number of features per time step.\n",
+        "        hidden_size: width of each LSTM layer's hidden state.\n",
+        "        num_layers: number of stacked LSTM layers.\n",
+        "        num_classes: length of the score vector produced per sample.\n",
+        "    \"\"\"\n",
+        "\n",
+        "    def __init__(self, input_size, hidden_size, num_layers, num_classes):\n",
+        "        super(RNN, self).__init__()\n",
+        "        self.hidden_size = hidden_size\n",
+        "        self.num_layers = num_layers\n",
+        "        self.lstm = nn.LSTM(input_size, hidden_size, num_layers, batch_first=True)\n",
+        "        self.fc = nn.Linear(hidden_size, num_classes)\n",
+        "\n",
+        "    def forward(self, x):\n",
+        "        \"\"\"Map x of shape (batch, seq_length, input_size) to scores of shape (batch, num_classes).\"\"\"\n",
+        "        # Zero initial hidden and cell states, allocated on the input's own device\n",
+        "        # and dtype so the module does not depend on the notebook-level `device`\n",
+        "        state_shape = (self.num_layers, x.size(0), self.hidden_size)\n",
+        "        h0 = torch.zeros(state_shape, device=x.device, dtype=x.dtype)\n",
+        "        c0 = torch.zeros(state_shape, device=x.device, dtype=x.dtype)\n",
+        "\n",
+        "        # Forward propagate LSTM\n",
+        "        out, _ = self.lstm(x, (h0, c0))  # out: tensor of shape (batch_size, seq_length, hidden_size)\n",
+        "\n",
+        "        # Decode the hidden state of the last time step\n",
+        "        out = self.fc(out[:, -1, :])\n",
+        "        return out\n",
+        "\n",
+        "model = RNN(input_size, hidden_size, num_layers, num_classes).to(device)"
+      ],
+      "execution_count": 0,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "EeQKqwxAGOod",
+        "colab_type": "code",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 218
+        },
+        "outputId": "5e6bf8ff-34ff-4d39-8e93-c2741f1cf6f8"
+      },
+      "source": [
+        "# Loss and optimizer\n",
+        "criterion = nn.CrossEntropyLoss()\n",
+        "optimizer = torch.optim.Adam(model.parameters(), lr=learning_rate)\n",
+        "\n",
+        "# Train the model\n",
+        "# Select training mode explicitly so that re-running this cell after an\n",
+        "# evaluation pass does not silently train with the model left in eval mode\n",
+        "model.train()\n",
+        "total_step = len(train_loader)\n",
+        "for epoch in range(num_epochs):\n",
+        "    for i, (images, labels) in enumerate(train_loader):\n",
+        "        # Turn each image batch into (batch, sequence_length, input_size) sequences\n",
+        "        images = images.reshape(-1, sequence_length, input_size).to(device)\n",
+        "        labels = labels.to(device)\n",
+        "\n",
+        "        # Forward pass\n",
+        "        outputs = model(images)\n",
+        "        loss = criterion(outputs, labels)\n",
+        "\n",
+        "        # Backward and optimize: clear stale gradients before accumulating new ones\n",
+        "        optimizer.zero_grad()\n",
+        "        loss.backward()\n",
+        "        optimizer.step()\n",
+        "\n",
+        "        # Report the current mini-batch loss every 100 steps\n",
+        "        if (i+1) % 100 == 0:\n",
+        "            print('Epoch [{}/{}], Step [{}/{}], Loss: {:.4f}'\n",
+        "                  .format(epoch+1, num_epochs, i+1, total_step, loss.item()))"
+      ],
+      "execution_count": 22,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Epoch [1/2], Step [100/600], Loss: 0.4692\n",
+            "Epoch [1/2], Step [200/600], Loss: 0.2797\n",
+            "Epoch [1/2], Step [300/600], Loss: 0.1271\n",
+            "Epoch [1/2], Step [400/600], Loss: 0.2750\n",
+            "Epoch [1/2], Step [500/600], Loss: 0.1792\n",
+            "Epoch [1/2], Step [600/600], Loss: 0.0991\n",
+            "Epoch [2/2], Step [100/600], Loss: 0.0826\n",
+            "Epoch [2/2], Step [200/600], Loss: 0.1674\n",
+            "Epoch [2/2], Step [300/600], Loss: 0.1562\n",
+            "Epoch [2/2], Step [400/600], Loss: 0.1447\n",
+            "Epoch [2/2], Step [500/600], Loss: 0.0842\n",
+            "Epoch [2/2], Step [600/600], Loss: 0.0283\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "j-5yxyHfEa7z",
+        "colab_type": "code",
+        "colab": {
+          "base_uri": "https://localhost:8080/",
+          "height": 34
+        },
+        "outputId": "84f5134c-0b9e-42e3-fcaf-42f528a3f363"
+      },
+      "source": [
+        "# Test the model\n",
+        "# Switch to evaluation mode so mode-dependent layers (e.g. dropout), if any\n",
+        "# are added to the model later, behave deterministically during scoring\n",
+        "model.eval()\n",
+        "\n",
+        "# Gradients are not needed for scoring, so skip building the autograd graph\n",
+        "with torch.no_grad():\n",
+        "    correct = 0\n",
+        "    total = 0\n",
+        "    for images, labels in test_loader:\n",
+        "        images = images.reshape(-1, sequence_length, input_size).to(device)\n",
+        "        labels = labels.to(device)\n",
+        "        outputs = model(images)\n",
+        "        # Index of the highest score along the class dimension is the prediction\n",
+        "        _, predicted = torch.max(outputs, 1)\n",
+        "        total += labels.size(0)\n",
+        "        correct += (predicted == labels).sum().item()\n",
+        "\n",
+        "    print('Test Accuracy of the model on the 10000 test images: {} %'.format(100 * correct / total)) \n",
+        "\n",
+        "# Save the model checkpoint\n",
+        "# torch.save(model.state_dict(), 'model.ckpt')"
+      ],
+      "execution_count": 23,
+      "outputs": [
+        {
+          "output_type": "stream",
+          "text": [
+            "Test Accuracy of the model on the 10000 test images: 97.55 %\n"
+          ],
+          "name": "stdout"
+        }
+      ]
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "cs2NL18qEaz2",
+        "colab_type": "code",
+        "colab": {}
+      },
+      "source": [
+        ""
+      ],
+      "execution_count": 0,
+      "outputs": []
+    },
+    {
+      "cell_type": "code",
+      "metadata": {
+        "id": "1BY0qUqTCrMq",
+        "colab_type": "code",
+        "colab": {}
+      },
+      "source": [
+        ""
+      ],
+      "execution_count": 0,
+      "outputs": []
+    }
+  ]
+}