wenouyang
diff --git a/CNTK_CNN.ipynb b/CNTK_CNN.ipynb
Lines changed: 55 additions & 43 deletions
@@ -26,6 +26,16 @@
    "cell_type": "code",
    "execution_count": 2,
    "metadata": {},
+   "outputs": [],
+   "source": [
+    "# Force one-gpu\n",
+    "os.environ[\"CUDA_VISIBLE_DEVICES\"] = \"0\""
+   ]
+  },
+  {
+   "cell_type": "code",
+   "execution_count": 3,
+   "metadata": {},
    "outputs": [
     {
      "name": "stdout",
@@ -34,9 +44,11 @@
       "OS:  linux\n",
       "Python:  3.5.2 |Anaconda custom (64-bit)| (default, Jul  2 2016, 17:53:06) \n",
       "[GCC 4.4.7 20120313 (Red Hat 4.4.7-1)]\n",
-      "Numpy:  1.13.3\n",
-      "CNTK:  2.2\n",
-      "GPU:  ['Tesla K80']\n"
+      "Numpy:  1.14.1\n",
+      "CNTK:  2.4\n",
+      "GPU:  ['Tesla P100-PCIE-16GB', 'Tesla P100-PCIE-16GB']\n",
+      "CUDA Version 8.0.61\n",
+      "CuDNN Version  6.0.21\n"
      ]
     }
    ],
@@ -45,16 +57,18 @@
     "print(\"Python: \", sys.version)\n",
     "print(\"Numpy: \", np.__version__)\n",
     "print(\"CNTK: \", cntk.__version__)\n",
-    "print(\"GPU: \", get_gpu_name())"
+    "print(\"GPU: \", get_gpu_name())\n",
+    "print(get_cuda_version())\n",
+    "print(\"CuDNN Version \", get_cudnn_version())"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 3,
+   "execution_count": 4,
    "metadata": {},
    "outputs": [],
    "source": [
-    "def create_symbol():\n",
+    "def create_symbol(n_classes=N_CLASSES):\n",
     "    # Weight initialiser from uniform distribution\n",
     "    # Activation (unless states) is None\n",
     "    with cntk.layers.default_options(init = cntk.glorot_uniform(), activation = cntk.relu):\n",
@@ -70,34 +84,34 @@
     "        \n",
     "        x = Dense(512)(x)\n",
     "        x = Dropout(0.5)(x)\n",
-    "        x = Dense(N_CLASSES, activation=None)(x)\n",
+    "        x = Dense(n_classes, activation=None)(x)\n",
     "        return x"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 4,
+   "execution_count": 5,
    "metadata": {},
    "outputs": [],
    "source": [
-    "def init_model(m):\n",
+    "def init_model(m, labels, lr=LR, momentum=MOMENTUM):\n",
     "    # Loss (dense labels); check if support for sparse labels\n",
     "    loss = cntk.cross_entropy_with_softmax(m, labels)  \n",
     "    # Momentum SGD\n",
     "    # https://github.com/Microsoft/CNTK/blob/master/Manual/Manual_How_to_use_learners.ipynb\n",
     "    # unit_gain=False: momentum_direction = momentum*old_momentum_direction + gradient\n",
     "    # if unit_gain=True then ...(1-momentum)*gradient\n",
     "    learner = cntk.momentum_sgd(m.parameters,\n",
-    "                                lr=cntk.learning_rate_schedule(LR, cntk.UnitType.minibatch) ,\n",
-    "                                momentum=cntk.momentum_schedule(MOMENTUM), \n",
+    "                                lr=cntk.learning_rate_schedule(lr, cntk.UnitType.minibatch) ,\n",
+    "                                momentum=cntk.momentum_schedule(momentum), \n",
     "                                unit_gain=False)\n",
     "    trainer = cntk.Trainer(m, (loss, cntk.classification_error(m, labels)), [learner])\n",
     "    return trainer"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 5,
+   "execution_count": 6,
    "metadata": {},
    "outputs": [
     {
@@ -108,8 +122,8 @@
       "Preparing test set...\n",
       "(50000, 3, 32, 32) (10000, 3, 32, 32) (50000, 10) (10000, 10)\n",
       "float32 float32 float32 float32\n",
-      "CPU times: user 833 ms, sys: 553 ms, total: 1.39 s\n",
-      "Wall time: 1.38 s\n"
+      "CPU times: user 671 ms, sys: 576 ms, total: 1.25 s\n",
+      "Wall time: 1.25 s\n"
      ]
     }
    ],
@@ -126,15 +140,15 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 6,
+   "execution_count": 7,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "CPU times: user 22.6 ms, sys: 28.6 ms, total: 51.2 ms\n",
-      "Wall time: 76.1 ms\n"
+      "CPU times: user 24 ms, sys: 32 ms, total: 56 ms\n",
+      "Wall time: 69 ms\n"
      ]
     }
    ],
@@ -149,51 +163,50 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 7,
+   "execution_count": 8,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "CPU times: user 72.1 ms, sys: 224 ms, total: 297 ms\n",
-      "Wall time: 303 ms\n"
+      "CPU times: user 119 ms, sys: 116 ms, total: 235 ms\n",
+      "Wall time: 236 ms\n"
      ]
     }
    ],
    "source": [
     "%%time\n",
-    "trainer = init_model(sym)"
+    "trainer = init_model(sym, labels)"
    ]
   },
   {
    "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": 9,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Epoch 1  |  Accuracy: 0.562500\n",
+      "Epoch 1  |  Accuracy: 0.468750\n",
       "Epoch 2  |  Accuracy: 0.640625\n",
-      "Epoch 3  |  Accuracy: 0.625000\n",
-      "Epoch 4  |  Accuracy: 0.703125\n",
-      "Epoch 5  |  Accuracy: 0.703125\n",
-      "Epoch 6  |  Accuracy: 0.765625\n",
-      "Epoch 7  |  Accuracy: 0.859375\n",
-      "Epoch 8  |  Accuracy: 0.796875\n",
-      "Epoch 9  |  Accuracy: 0.781250\n",
-      "Epoch 10  |  Accuracy: 0.796875\n",
-      "CPU times: user 2min 19s, sys: 21.4 s, total: 2min 40s\n",
-      "Wall time: 2min 43s\n"
+      "Epoch 3  |  Accuracy: 0.609375\n",
+      "Epoch 4  |  Accuracy: 0.578125\n",
+      "Epoch 5  |  Accuracy: 0.812500\n",
+      "Epoch 6  |  Accuracy: 0.781250\n",
+      "Epoch 7  |  Accuracy: 0.671875\n",
+      "Epoch 8  |  Accuracy: 0.843750\n",
+      "Epoch 9  |  Accuracy: 0.796875\n",
+      "Epoch 10  |  Accuracy: 0.843750\n",
+      "CPU times: user 40.3 s, sys: 13.1 s, total: 53.3 s\n",
+      "Wall time: 53.2 s\n"
      ]
     }
    ],
    "source": [
     "%%time \n",
-    "# 163s\n",
-    "# Train model\n",
+    "# Main training loop: 53s\n",
     "for j in range(EPOCHS):\n",
     "    for data, label in yield_mb(x_train, y_train, BATCHSIZE, shuffle=True):\n",
     "        trainer.train_minibatch({features: data, labels: label})\n",
@@ -204,22 +217,21 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 9,
+   "execution_count": 10,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "CPU times: user 850 ms, sys: 337 ms, total: 1.19 s\n",
-      "Wall time: 1.4 s\n"
+      "CPU times: user 291 ms, sys: 88.9 ms, total: 379 ms\n",
+      "Wall time: 408 ms\n"
      ]
     }
    ],
    "source": [
     "%%time\n",
-    "# Predict and then score accuracy\n",
-    "# (We don't need softmax -> monotonic function)\n",
+    "# Main evaluation loop: 343ms\n",
     "n_samples = (y_test.shape[0]//BATCHSIZE)*BATCHSIZE\n",
     "y_guess = np.zeros(n_samples, dtype=np.int)\n",
     "y_truth = np.argmax(y_test[:n_samples], axis=-1)\n",
@@ -232,14 +244,14 @@
   },
   {
    "cell_type": "code",
-   "execution_count": 10,
+   "execution_count": 11,
    "metadata": {},
    "outputs": [
     {
      "name": "stdout",
      "output_type": "stream",
      "text": [
-      "Accuracy:  0.780649038462\n"
+      "Accuracy:  0.7701322115384616\n"
      ]
     }
    ],
@@ -251,7 +263,7 @@
  "metadata": {
   "anaconda-cloud": {},
   "kernelspec": {
-   "display_name": "Python [default]",
+   "display_name": "Python 3",
    "language": "python",
    "name": "python3"
   },