wenouyang
diff --git a/‎notebooks/CNTK_CNN_highAPI.ipynb
Lines changed: 301 additions & 0 deletions b/‎notebooks/CNTK_CNN_highAPI.ipynb
Lines changed: 301 additions & 0 deletions
@@ -0,0 +1,301 @@
+{
+ "cells": [
+  {
+   "cell_type": "markdown",
+   "metadata": {},
+   "source": [
+    "# High-level CNTK Example"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 1,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "import numpy as np\n",
+    "import os\n",
+    "import sys\n",
+    "import cntk\n",
+    "from cntk.layers import Convolution2D, MaxPooling, Dense, Dropout\n",
+    "from common.params import *\n",
+    "from common.utils import *"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 2,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Force one-gpu\n",
+    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"0\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "OS:  linux\n",
+      "Python:  3.5.2 |Anaconda custom (64-bit)| (default, Jul  2 2016, 17:53:06) \n",
+      "[GCC 4.4.7 20120313 (Red Hat 4.4.7-1)]\n",
+      "Numpy:  1.14.1\n",
+      "CNTK:  2.4\n",
+      "GPU:  ['Tesla P100-PCIE-16GB', 'Tesla P100-PCIE-16GB']\n",
+      "CUDA Version 8.0.61\n",
+      "CuDNN Version  6.0.21\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(\"OS: \", sys.platform)\n",
+    "print(\"Python: \", sys.version)\n",
+    "print(\"Numpy: \", np.__version__)\n",
+    "print(\"CNTK: \", cntk.__version__)\n",
+    "print(\"GPU: \", get_gpu_name())\n",
+    "print(get_cuda_version())\n",
+    "print(\"CuDNN Version \", get_cudnn_version())"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 4,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def create_symbol(n_classes=N_CLASSES):\n",
+    "    # Weight initialiser from uniform distribution\n",
+    "    # Activation (unless states) is None\n",
+    "    with cntk.layers.default_options(init = cntk.glorot_uniform(), activation = cntk.relu):\n",
+    "        x = Convolution2D(filter_shape=(3, 3), num_filters=50, pad=True)(features)\n",
+    "        x = Convolution2D(filter_shape=(3, 3), num_filters=50, pad=True)(x)\n",
+    "        x = MaxPooling((2, 2), strides=(2, 2), pad=False)(x)\n",
+    "        x = Dropout(0.25)(x)\n",
+    "\n",
+    "        x = Convolution2D(filter_shape=(3, 3), num_filters=100, pad=True)(x)\n",
+    "        x = Convolution2D(filter_shape=(3, 3), num_filters=100, pad=True)(x)\n",
+    "        x = MaxPooling((2, 2), strides=(2, 2), pad=False)(x)\n",
+    "        x = Dropout(0.25)(x)    \n",
+    "        \n",
+    "        x = Dense(512)(x)\n",
+    "        x = Dropout(0.5)(x)\n",
+    "        x = Dense(n_classes, activation=None)(x)\n",
+    "        return x"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 5,
+   "metadata": {},
+   "outputs": [],
+   "source": [
+    "def init_model(m, labels, lr=LR, momentum=MOMENTUM):\n",
+    "    # Loss (dense labels); check if support for sparse labels\n",
+    "    loss = cntk.cross_entropy_with_softmax(m, labels)\n",
+    "    # Momentum SGD\n",
+    "    # https://github.com/Microsoft/CNTK/blob/master/Manual/Manual_How_to_use_learners.ipynb\n",
+    "    # unit_gain=False: momentum_direction = momentum*old_momentum_direction + gradient\n",
+    "    # if unit_gain=True then ...(1-momentum)*gradient\n",
+    "    learner = cntk.momentum_sgd(m.parameters, \n",
+    "                                lr=cntk.learning_rate_schedule(lr, cntk.UnitType.minibatch) , \n",
+    "                                momentum=cntk.momentum_schedule(momentum),\n",
+    "                                unit_gain=False)\n",
+    "    return loss, learner"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 6,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Preparing train set...\n",
+      "Preparing test set...\n",
+      "(50000, 3, 32, 32) (10000, 3, 32, 32) (50000, 10) (10000, 10)\n",
+      "float32 float32 float32 float32\n",
+      "CPU times: user 738 ms, sys: 575 ms, total: 1.31 s\n",
+      "Wall time: 1.31 s\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "# Data into format for library\n",
+    "x_train, x_test, y_train, y_test = cifar_for_library(channel_first=True, one_hot=True)\n",
+    "# CNTK format\n",
+    "y_train = y_train.astype(np.float32)\n",
+    "y_test = y_test.astype(np.float32)\n",
+    "print(x_train.shape, x_test.shape, y_train.shape, y_test.shape)\n",
+    "print(x_train.dtype, x_test.dtype, y_train.dtype, y_test.dtype)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 7,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 16.7 ms, sys: 40.4 ms, total: 57.1 ms\n",
+      "Wall time: 67.4 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "# Placeholders\n",
+    "features = cntk.input_variable((3, 32, 32), np.float32)\n",
+    "labels = cntk.input_variable(N_CLASSES, np.float32)\n",
+    "# Load symbol\n",
+    "sym = create_symbol()"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 8,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 122 ms, sys: 116 ms, total: 238 ms\n",
+      "Wall time: 239 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "loss, learner = init_model(sym, labels)"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 9,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 37.9 s, sys: 10.8 s, total: 48.7 s\n",
+      "Wall time: 48.8 s\n"
+     ]
+    },
+    {
+     "data": {
+      "text/plain": [
+       "{'epoch_summaries': [{'loss': 1.8144259375, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 1.36322234375, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 1.122504140625, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.974794296875, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.8672890625, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.7853078125, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.716815546875, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.65541078125, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.606273671875, 'metric': 0.0, 'samples': 50000},\n",
+       "  {'loss': 0.560514921875, 'metric': 0.0, 'samples': 50000}],\n",
+       " 'updates': [{'loss': 1.8144589081005922, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 1.363123699583867, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 1.1224501996889005, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.9746546238546335, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.8671638205475752, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.7853081736155569, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.7168769787582027, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.6554993300981314, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.6063771656930218, 'metric': 0.0, 'samples': 49984},\n",
+       "  {'loss': 0.5606013064805738, 'metric': 0.0, 'samples': 49984}]}"
+      ]
+     },
+     "execution_count": 9,
+     "metadata": {},
+     "output_type": "execute_result"
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "# Main training loop: 49s\n",
+    "loss.train((x_train, y_train), \n",
+    "           minibatch_size=BATCHSIZE, \n",
+    "           max_epochs=EPOCHS,\n",
+    "           parameter_learners=[learner])"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 10,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "CPU times: user 284 ms, sys: 95.9 ms, total: 380 ms\n",
+      "Wall time: 409 ms\n"
+     ]
+    }
+   ],
+   "source": [
+    "%%time\n",
+    "# Main evaluation loop: 409ms\n",
+    "n_samples = (y_test.shape[0]//BATCHSIZE)*BATCHSIZE\n",
+    "y_guess = np.zeros(n_samples, dtype=np.int)\n",
+    "y_truth = np.argmax(y_test[:n_samples], axis=-1)\n",
+    "c = 0\n",
+    "for data, label in yield_mb(x_test, y_test, BATCHSIZE):\n",
+    "    predicted_label_probs = sym.eval({features : data})\n",
+    "    y_guess[c*BATCHSIZE:(c+1)*BATCHSIZE] = np.argmax(predicted_label_probs, axis=-1)\n",
+    "    c += 1"
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 11,
+   "metadata": {},
+   "outputs": [
+    {
+     "name": "stdout",
+     "output_type": "stream",
+     "text": [
+      "Accuracy:  0.7591145833333334\n"
+     ]
+    }
+   ],
+   "source": [
+    "print(\"Accuracy: \", 1.*sum(y_guess == y_truth)/len(y_guess))"
+   ]
+  }
+ ],
+ "metadata": {
+  "anaconda-cloud": {},
+  "kernelspec": {
+   "display_name": "Python 3",
+   "language": "python",
+   "name": "python3"
+  },
+  "language_info": {
+   "codemirror_mode": {
+    "name": "ipython",
+    "version": 3
+   },
+   "file_extension": ".py",
+   "mimetype": "text/x-python",
+   "name": "python",
+   "nbconvert_exporter": "python",
+   "pygments_lexer": "ipython3",
+   "version": "3.5.2"
+  }
+ },
+ "nbformat": 4,
+ "nbformat_minor": 2
+}