sunxvming
diff --git a/make-your-own-neural-network/pytorch_neural_network_mnist_data.ipynb b/make-your-own-neural-network/pytorch_neural_network_mnist_data.ipynb
Lines changed: 258 additions & 0 deletions
@@ -0,0 +1,258 @@
+{
+ "cells": [
+  {
+   "cell_type": "code",
+   "execution_count": 37,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import torch\n",
+    "from torch.autograd import Variable\n",
+    "import torch.nn as nn\n",
+    "\n",
+    "import numpy"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 38,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "class NeuralNetwork(nn.Module):\n",
+    "\n",
+    "    def __init__(self, inodes, hnodes, onodes, learning_rate):\n",
+    "        # call the base class's initialisation too\n",
+    "        super().__init__()\n",
+    "        \n",
+    "        # dimensions\n",
+    "        self.inodes = inodes\n",
+    "        self.hnodes = hnodes\n",
+    "        self.onodes = onodes\n",
+    "        \n",
+    "        # learning rate\n",
+    "        self.lr = learning_rate\n",
+    "        \n",
+    "        # define the layers and their sizes, turn off bias\n",
+    "        self.linear_ih = nn.Linear(inodes, hnodes, bias=False)\n",
+    "        self.linear_ho = nn.Linear(hnodes, onodes, bias=False)\n",
+    "        \n",
+    "        # define activation function\n",
+    "        self.activation = nn.Sigmoid()\n",
+    "        \n",
+    "        # create error function\n",
+    "        self.error_function = torch.nn.MSELoss(size_average=False)\n",
+    "\n",
+    "        # create optimiser, using simple stochastic gradient descent\n",
+    "        self.optimiser = torch.optim.SGD(self.parameters(), self.lr)\n",
+    "\n",
+    "        pass\n",
+    "\n",
+    "    \n",
+    "    def forward(self, inputs_list):\n",
+    "        # convert list to a 2-D FloatTensor then wrap in Variable \n",
+    "        # a CPU tensor is used here; to run on the GPU, swap in the commented-out torch.cuda.FloatTensor line below\n",
+    "        # inputs = Variable(torch.cuda.FloatTensor(inputs_list).view(1, self.inodes))\n",
+    "        inputs = Variable(torch.FloatTensor(inputs_list).view(1, self.inodes))\n",
+    "        \n",
+    "        # combine input layer signals into hidden layer\n",
+    "        hidden_inputs = self.linear_ih(inputs)\n",
+    "        # apply sigmoid activation function\n",
+    "        hidden_outputs = self.activation(hidden_inputs)\n",
+    "        \n",
+    "        # combine hidden layer signals into output layer\n",
+    "        final_inputs = self.linear_ho(hidden_outputs)\n",
+    "        # apply sigmoid activation function\n",
+    "        final_outputs = self.activation(final_inputs)\n",
+    "        \n",
+    "        return final_outputs\n",
+    "\n",
+    "    \n",
+    "    def train(self, inputs_list, targets_list):\n",
+    "        # calculate the output of the network\n",
+    "        output = self.forward(inputs_list)\n",
+    "\n",
+    "        # create a Variable out of the target vector, doesn't need gradients calculated\n",
+    "        # a CPU tensor is used here; to run on the GPU, swap in the commented-out torch.cuda.FloatTensor line below\n",
+    "        # target_variable = Variable(torch.cuda.FloatTensor(targets_list).view(1, self.onodes), requires_grad=False)\n",
+    "        target_variable = Variable(torch.FloatTensor(targets_list).view(1, self.onodes), requires_grad=False)\n",
+    "        \n",
+    "        # calculate error\n",
+    "        loss = self.error_function(output, target_variable)\n",
+    "        #print(loss.data[0])\n",
+    "\n",
+    "        # zero gradients, perform a backward pass, and update the weights.\n",
+    "        self.optimiser.zero_grad()\n",
+    "        loss.backward()\n",
+    "        self.optimiser.step()\n",
+    "        pass\n",
+    "\n",
+    "    pass"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 39,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# number of input, hidden and output nodes\n",
+    "input_nodes = 784\n",
+    "hidden_nodes = 200\n",
+    "output_nodes = 10\n",
+    "\n",
+    "# learning rate\n",
+    "learning_rate = 0.1\n",
+    "\n",
+    "# create instance of neural network\n",
+    "n = NeuralNetwork(input_nodes,hidden_nodes,output_nodes, learning_rate)\n",
+    "\n",
+    "# to move the neural network to the GPU, uncomment the line below\n",
+    "# n.cuda()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 40,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# load the mnist training data CSV file into a list\n",
+    "training_data_file = open(\"mnist_dataset/mnist_train.csv\", 'r')\n",
+    "training_data_list = training_data_file.readlines()\n",
+    "training_data_file.close()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 41,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# %%timeit -n1 -r1 -c\n",
+    "\n",
+    "# train the neural network\n",
+    "\n",
+    "# epochs is the number of times the training data set is used for training\n",
+    "epochs = 5\n",
+    "\n",
+    "for e in range(epochs):\n",
+    "    # go through all records in the training data set\n",
+    "    for record in training_data_list:\n",
+    "        # split the record by the ',' commas\n",
+    "        all_values = record.split(',')\n",
+    "        # scale and shift the inputs\n",
+    "        inputs = (numpy.asfarray(all_values[1:]) / 255.0 * 0.99) + 0.01\n",
+    "        # create the target output values (all 0.01, except the desired label which is 0.99)\n",
+    "        targets = numpy.zeros(output_nodes) + 0.01\n",
+    "        # all_values[0] is the target label for this record\n",
+    "        targets[int(all_values[0])] = 0.99\n",
+    "        n.train(inputs, targets)\n",
+    "        pass\n",
+    "    pass"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 42,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# load the mnist test data CSV file into a list\n",
+    "test_data_file = open(\"mnist_dataset/mnist_test.csv\", 'r')\n",
+    "test_data_list = test_data_file.readlines()\n",
+    "test_data_file.close()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 43,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "# test the neural network\n",
+    "\n",
+    "# scorecard for how well the network performs, initially empty\n",
+    "scorecard = []\n",
+    "\n",
+    "# go through all the records in the test data set\n",
+    "for record in test_data_list:\n",
+    "    # split the record by the ',' commas\n",
+    "    all_values = record.split(',')\n",
+    "    # correct answer is first value\n",
+    "    correct_label = int(all_values[0])\n",
+    "    # scale and shift the inputs\n",
+    "    inputs = (numpy.asfarray(all_values[1:]) / 255.0 * 0.99) + 0.01\n",
+    "    # query the network\n",
+    "    outputs = n.forward(inputs)\n",
+    "    # the index of the highest value corresponds to the label\n",
+    "    m, label = outputs.max(1)\n",
+    "    # append correct or incorrect to list\n",
+    "    # label.data[0] pulls the predicted index out of the pytorch tensor so it can be compared to the python integer\n",
+    "    # print(\"label.data:\",label.data[0])\n",
+    "    # print(\"correct_label:\",correct_label)\n",
+    "    if (label.data[0] == correct_label):\n",
+    "        # network's answer matches correct answer, add 1 to scorecard\n",
+    "        scorecard.append(1)\n",
+    "    else:\n",
+    "        # network's answer doesn't match correct answer, add 0 to scorecard\n",
+    "        scorecard.append(0)\n",
+    "        pass\n",
+    "    \n",
+    "    pass"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 44,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "performance =  0.5\n"
+     ]
+    }
+   ],
+   "source": [
+    "# calculate the performance score, the fraction of correct answers\n",
+    "scorecard_array = numpy.asarray(scorecard)\n",
+    "print (\"performance = \", scorecard_array.sum() / scorecard_array.size)"
+   ]
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.11.1"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}