eigenfoo-archives
diff --git a/‎.DS_Store
6 KB b/‎.DS_Store
6 KB
diff --git a/‎doc/.DS_Store
6 KB b/‎doc/.DS_Store
6 KB
diff --git a/‎doc/assignment_prompt.pdf
108 KB b/‎doc/assignment_prompt.pdf
108 KB
diff --git a/‎neural_net/.ipynb_checkpoints/neural_net-checkpoint.ipynb
+250 b/‎neural_net/.ipynb_checkpoints/neural_net-checkpoint.ipynb
+250
@@ -0,0 +1,250 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# AI Assignment 2: Neural Network"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "import numpy as np"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "def sigmoid(z):\n",
+    "    '''Logistic function 1 / (1 + exp(-z)), evaluated with np.exp.'''\n",
+    "    denominator = 1.0 + np.exp(-z)\n",
+    "    return 1.0 / denominator\n",
+    "\n",
+    "def sigmoid_prime(z):\n",
+    "    '''First derivative of the sigmoid: s(z) * (1 - s(z)).'''\n",
+    "    s = sigmoid(z)\n",
+    "    return s * (1-s)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 32,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def read_neural_net_file(nn_filename):\n",
+    "    '''\n",
+    "    Parses a neural net initialization file.\n",
+    "\n",
+    "    The first line holds three integers: Ni, Nh and No. The next Nh\n",
+    "    lines each hold a bias followed by the Ni weights of one hidden\n",
+    "    node; the No lines after that each hold a bias followed by the Nh\n",
+    "    weights of one output node.\n",
+    "\n",
+    "    Returns (Ni, Nh, No, b1, w1, b2, w2), where b1 is Nh x 1, w1 is\n",
+    "    Nh x Ni, b2 is No x 1 and w2 is No x Nh.\n",
+    "    '''\n",
+    "\n",
+    "    def load_layer(handle, n_rows, n_cols):\n",
+    "        # One text line per node: the bias first, then its weights.\n",
+    "        biases = np.zeros([n_rows, 1])\n",
+    "        weights = np.zeros([n_rows, n_cols])\n",
+    "        for row in range(n_rows):\n",
+    "            values = [float(tok) for tok in handle.readline().split()]\n",
+    "            biases[row] = values[0]\n",
+    "            weights[row, :] = values[1:]\n",
+    "        return biases, weights\n",
+    "\n",
+    "    with open(nn_filename) as f:\n",
+    "        Ni, Nh, No = [int(tok) for tok in f.readline().split()]\n",
+    "        b1, w1 = load_layer(f, Nh, Ni)\n",
+    "        b2, w2 = load_layer(f, No, Nh)\n",
+    "\n",
+    "    return Ni, Nh, No, b1, w1, b2, w2"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 35,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def read_train_file(train_filename):\n",
+    "    '''\n",
+    "    Reads a training file and returns its examples as two arrays.\n",
+    "\n",
+    "    Expected layout: a header line with three integers (number of\n",
+    "    observations, number of inputs Ni, number of outputs No), then one\n",
+    "    whitespace-separated line per observation holding Ni input values\n",
+    "    followed by No output values.\n",
+    "\n",
+    "    Returns (inputs, outputs) with shapes (num_obs, Ni) and\n",
+    "    (num_obs, No).\n",
+    "    '''\n",
+    "\n",
+    "    # Read from the caller-supplied path, not a fixed dataset file.\n",
+    "    with open(train_filename) as f:\n",
+    "        line = f.readline()\n",
+    "        nums = [int(num) for num in line.split()]\n",
+    "        num_obs, Ni, No = nums\n",
+    "\n",
+    "        inputs = np.zeros([num_obs, Ni])\n",
+    "        outputs = np.zeros([num_obs, No])\n",
+    "\n",
+    "        for i in range(num_obs):\n",
+    "            line = f.readline()\n",
+    "            nums = [float(num) for num in line.split()]\n",
+    "            # The first Ni values are features, the rest are targets.\n",
+    "            inputs[i, :] = nums[:Ni]\n",
+    "            outputs[i, :] = nums[Ni:]\n",
+    "\n",
+    "    return inputs, outputs"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": [
+    "class NeuralNetwork(object):\n",
+    "    '''\n",
+    "    Sigmoid network with one hidden layer, trained by mini-batch\n",
+    "    stochastic gradient descent with backpropagation.\n",
+    "\n",
+    "    Attributes:\n",
+    "        Ni, Nh, No: number of input, hidden and output nodes.\n",
+    "        b1, w1: hidden-layer biases and weights.\n",
+    "        b2, w2: output-layer biases and weights.\n",
+    "        biases, weights: the same arrays as layer-ordered lists,\n",
+    "            [b1, b2] and [w1, w2]; the methods iterate over these.\n",
+    "        num_layers: number of layers, counting the input layer.\n",
+    "    '''\n",
+    "\n",
+    "    def __init__(self, neural_net_filename):\n",
+    "        '''Load the initial parameters via read_neural_net_file.'''\n",
+    "        # Parenthesised so the tuple unpacking can span several lines.\n",
+    "        (self.Ni, self.Nh, self.No,\n",
+    "         self.b1, self.w1, self.b2, self.w2) = read_neural_net_file(\n",
+    "             neural_net_filename)\n",
+    "        self.biases = [self.b1, self.b2]\n",
+    "        self.weights = [self.w1, self.w2]\n",
+    "        self.num_layers = len(self.weights) + 1\n",
+    "\n",
+    "    def feedforward(self, a):\n",
+    "        '''Return the output of the network if ``a`` is input.\n",
+    "\n",
+    "        NOTE(review): assumes ``a`` is a column vector of shape\n",
+    "        (Ni, 1) so that adding the bias broadcasts as intended.\n",
+    "        '''\n",
+    "        for b, w in zip(self.biases, self.weights):\n",
+    "            a = sigmoid(np.dot(w, a) + b)\n",
+    "        return a\n",
+    "\n",
+    "    def SGD(self, training_data, epochs, mini_batch_size, eta,\n",
+    "            test_data=None):\n",
+    "        '''Train the network using mini-batch stochastic gradient\n",
+    "        descent.\n",
+    "\n",
+    "        ``training_data`` is a list of tuples ``(x, y)`` of training\n",
+    "        inputs and desired outputs; it is shuffled in place at the\n",
+    "        start of every epoch. ``eta`` is the learning rate. If\n",
+    "        ``test_data`` is provided, the network is evaluated against it\n",
+    "        after each epoch and the score is printed, which is useful for\n",
+    "        tracking progress but slows training down.\n",
+    "        '''\n",
+    "        # Imported here because the notebook itself only imports numpy.\n",
+    "        import random\n",
+    "\n",
+    "        if test_data:\n",
+    "            n_test = len(test_data)\n",
+    "        n = len(training_data)\n",
+    "        for j in range(epochs):\n",
+    "            random.shuffle(training_data)\n",
+    "            mini_batches = [\n",
+    "                training_data[k:k+mini_batch_size]\n",
+    "                for k in range(0, n, mini_batch_size)]\n",
+    "            for mini_batch in mini_batches:\n",
+    "                self.update_mini_batch(mini_batch, eta)\n",
+    "            if test_data:\n",
+    "                print('Epoch {0}: {1} / {2}'.format(\n",
+    "                    j, self.evaluate(test_data), n_test))\n",
+    "            else:\n",
+    "                print('Epoch {0} complete'.format(j))\n",
+    "\n",
+    "    def update_mini_batch(self, mini_batch, eta):\n",
+    "        '''Apply one gradient-descent step computed from a single\n",
+    "        mini batch.\n",
+    "\n",
+    "        ``mini_batch`` is a list of tuples ``(x, y)`` and ``eta`` is\n",
+    "        the learning rate. The per-example gradients from backprop\n",
+    "        are summed and scaled by eta / len(mini_batch).\n",
+    "        '''\n",
+    "        nabla_b = [np.zeros(b.shape) for b in self.biases]\n",
+    "        nabla_w = [np.zeros(w.shape) for w in self.weights]\n",
+    "        for x, y in mini_batch:\n",
+    "            delta_nabla_b, delta_nabla_w = self.backprop(x, y)\n",
+    "            nabla_b = [nb+dnb for nb, dnb in zip(nabla_b, delta_nabla_b)]\n",
+    "            nabla_w = [nw+dnw for nw, dnw in zip(nabla_w, delta_nabla_w)]\n",
+    "        step = eta / len(mini_batch)\n",
+    "        self.weights = [w - step*nw\n",
+    "                        for w, nw in zip(self.weights, nabla_w)]\n",
+    "        self.biases = [b - step*nb\n",
+    "                       for b, nb in zip(self.biases, nabla_b)]\n",
+    "        # Keep the per-layer attributes pointing at the updated arrays.\n",
+    "        self.b1, self.b2 = self.biases\n",
+    "        self.w1, self.w2 = self.weights\n",
+    "\n",
+    "    def backprop(self, x, y):\n",
+    "        '''Return a tuple ``(nabla_b, nabla_w)`` holding the gradient\n",
+    "        of the cost for the single example ``(x, y)``.\n",
+    "\n",
+    "        ``nabla_b`` and ``nabla_w`` are layer-by-layer lists of numpy\n",
+    "        arrays shaped like ``self.biases`` and ``self.weights``.\n",
+    "        NOTE(review): assumes ``x`` and ``y`` are column vectors.\n",
+    "        '''\n",
+    "        nabla_b = [np.zeros(b.shape) for b in self.biases]\n",
+    "        nabla_w = [np.zeros(w.shape) for w in self.weights]\n",
+    "        # Forward pass, storing every weighted input z and activation.\n",
+    "        activation = x\n",
+    "        activations = [x]\n",
+    "        zs = []\n",
+    "        for b, w in zip(self.biases, self.weights):\n",
+    "            z = np.dot(w, activation) + b\n",
+    "            zs.append(z)\n",
+    "            activation = sigmoid(z)\n",
+    "            activations.append(activation)\n",
+    "        # Backward pass, starting with the error at the output layer.\n",
+    "        delta = (self.cost_derivative(activations[-1], y)\n",
+    "                 * sigmoid_prime(zs[-1]))\n",
+    "        nabla_b[-1] = delta\n",
+    "        nabla_w[-1] = np.dot(delta, activations[-2].transpose())\n",
+    "        # l counts layers from the end (l = 1 is the output layer,\n",
+    "        # l = 2 the layer before it), which lets the negative list\n",
+    "        # indices below pick out the matching entries.\n",
+    "        for l in range(2, self.num_layers):\n",
+    "            z = zs[-l]\n",
+    "            sp = sigmoid_prime(z)\n",
+    "            delta = np.dot(self.weights[-l+1].transpose(), delta) * sp\n",
+    "            nabla_b[-l] = delta\n",
+    "            nabla_w[-l] = np.dot(delta, activations[-l-1].transpose())\n",
+    "        return (nabla_b, nabla_w)\n",
+    "\n",
+    "    def evaluate(self, test_data):\n",
+    "        '''Return the number of test inputs for which the network\n",
+    "        outputs the correct result.\n",
+    "\n",
+    "        The prediction is the index of the output neuron with the\n",
+    "        highest activation, compared with ``y`` using ``==``.\n",
+    "        NOTE(review): this presumes ``y`` is a class index; confirm\n",
+    "        against the format of the test data.\n",
+    "        '''\n",
+    "        test_results = [(np.argmax(self.feedforward(x)), y)\n",
+    "                        for (x, y) in test_data]\n",
+    "        return sum(int(x == y) for (x, y) in test_results)\n",
+    "\n",
+    "    def cost_derivative(self, output_activations, y):\n",
+    "        '''Return the vector of partial derivatives of the cost C_x\n",
+    "        with respect to the output activations.'''\n",
+    "        return (output_activations-y)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": null,
+   "metadata": {
+    "collapsed": true
+   },
+   "outputs": [],
+   "source": []
+  }
+ ],
+ "metadata": {
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.6.1"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}