MITDeepLearning
diff --git a/lab2/Part1_MNIST.ipynb b/lab2/Part1_MNIST.ipynb
Lines changed: 37 additions & 21 deletions
@@ -10,9 +10,9 @@
         "  <td align=\"center\"><a target=\"_blank\" href=\"http://introtodeeplearning.com\">\n",
         "        <img src=\"https://i.ibb.co/Jr88sn2/mit.png\" style=\"padding-bottom:5px;\" />\n",
         "      Visit MIT Deep Learning</a></td>\n",
-        "  <td align=\"center\"><a target=\"_blank\" href=\"https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab2/Part1_MNIST.ipynb\">\n",
+        "  <td align=\"center\"><a target=\"_blank\" href=\"https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab2/solutions/Part1_MNIST_Solution.ipynb\">\n",
         "        <img src=\"https://i.ibb.co/2P3SLwK/colab.png\"  style=\"padding-bottom:5px;\" />Run in Google Colab</a></td>\n",
-        "  <td align=\"center\"><a target=\"_blank\" href=\"https://github.com/aamini/introtodeeplearning/blob/master/lab2/Part1_MNIST.ipynb\">\n",
+        "  <td align=\"center\"><a target=\"_blank\" href=\"https://github.com/aamini/introtodeeplearning/blob/master/lab2/solutions/Part1_MNIST_Solution.ipynb\">\n",
         "        <img src=\"https://i.ibb.co/xfJbPmL/github.png\"  height=\"70px\" style=\"padding-bottom:5px;\"  />View Source on GitHub</a></td>\n",
         "</table>\n",
         "\n",
@@ -62,6 +62,7 @@
       "outputs": [],
       "source": [
         "# Import Tensorflow 2.0\n",
+        "# !pip install tensorflow\n",
         "import tensorflow as tf\n",
         "\n",
         "# MIT introduction to deep learning package\n",
@@ -107,7 +108,7 @@
       "cell_type": "code",
       "source": [
         "# start a first comet experiment for the first part of the lab\n",
-        "comet_ml.init(project_name=\"6S191lab2_part1_NN\")\n",
+        "comet_ml.init(project_name=\"6S191_lab2_part1_NN\")\n",
         "comet_model_1 = comet_ml.Experiment()"
       ],
       "metadata": {
@@ -215,10 +216,12 @@
         "      tf.keras.layers.Flatten(),\n",
         "\n",
         "      # '''TODO: Define the activation function for the first fully connected (Dense) layer.'''\n",
-        "      tf.keras.layers.Dense(128, activation= '''TODO'''),\n",
+        "      tf.keras.layers.Dense(128, activation=tf.nn.relu),\n",
+        "      # tf.keras.layers.Dense(128, activation= '''TODO'''),\n",
         "\n",
         "      # '''TODO: Define the second Dense layer to output the classification probabilities'''\n",
-        "      [TODO Dense layer to output classification probabilities]\n",
+        "      tf.keras.layers.Dense(10, activation=tf.nn.softmax)\n",
+        "      # [TODO Dense layer to output classification probabilities]\n",
         "\n",
         "  ])\n",
         "  return fc_model\n",
@@ -345,7 +348,8 @@
       "outputs": [],
       "source": [
         "'''TODO: Use the evaluate method to test the model!'''\n",
-        "test_loss, test_acc = # TODO\n",
+        "test_loss, test_acc = model.evaluate(test_images, test_labels)\n",
+        "# test_loss, test_acc = # TODO\n",
         "\n",
         "print('Test accuracy:', test_acc)"
       ]
@@ -406,24 +410,29 @@
         "    cnn_model = tf.keras.Sequential([\n",
         "\n",
         "        # TODO: Define the first convolutional layer\n",
-        "        tf.keras.layers.Conv2D('''TODO''')\n",
+        "        tf.keras.layers.Conv2D(filters=24, kernel_size=(3,3), activation=tf.nn.relu),\n",
+        "        # tf.keras.layers.Conv2D('''TODO''')\n",
         "\n",
         "        # TODO: Define the first max pooling layer\n",
-        "        tf.keras.layers.MaxPool2D('''TODO''')\n",
+        "        tf.keras.layers.MaxPool2D(pool_size=(2,2)),\n",
+        "        # tf.keras.layers.MaxPool2D('''TODO''')\n",
         "\n",
         "        # TODO: Define the second convolutional layer\n",
-        "        tf.keras.layers.Conv2D('''TODO''')\n",
+        "        tf.keras.layers.Conv2D(filters=36, kernel_size=(3,3), activation=tf.nn.relu),\n",
+        "        # tf.keras.layers.Conv2D('''TODO''')\n",
         "\n",
         "        # TODO: Define the second max pooling layer\n",
-        "        tf.keras.layers.MaxPool2D('''TODO''')\n",
+        "        tf.keras.layers.MaxPool2D(pool_size=(2,2)),\n",
+        "        # tf.keras.layers.MaxPool2D('''TODO''')\n",
         "\n",
         "        tf.keras.layers.Flatten(),\n",
         "        tf.keras.layers.Dense(128, activation=tf.nn.relu),\n",
         "\n",
         "        # TODO: Define the last Dense layer to output the classification\n",
         "        # probabilities. Pay attention to the activation needed for a probability\n",
         "        # output\n",
-        "        [TODO Dense layer to output classification probabilities]\n",
+        "        tf.keras.layers.Dense(10, activation=tf.nn.softmax)\n",
+        "        # [TODO Dense layer to output classification probabilities]\n",
         "    ])\n",
         "\n",
         "    return cnn_model\n",
@@ -458,7 +467,10 @@
         "comet_model_2 = comet_ml.Experiment()\n",
         "\n",
         "'''TODO: Define the compile operation with your optimizer and learning rate of choice'''\n",
-        "cnn_model.compile(optimizer='''TODO''', loss='''TODO''', metrics=['accuracy']) # TODO"
+        "cnn_model.compile(optimizer=tf.keras.optimizers.Adam(learning_rate=1e-3),\n",
+        "              loss='sparse_categorical_crossentropy',\n",
+        "              metrics=['accuracy'])\n",
+        "# cnn_model.compile(optimizer='''TODO''', loss='''TODO''', metrics=['accuracy']) # TODO"
       ]
     },
     {
@@ -479,8 +491,9 @@
       "outputs": [],
       "source": [
         "'''TODO: Use model.fit to train the CNN model, with the same batch_size and number of epochs previously used.'''\n",
-        "cnn_model.fit('''TODO''')\n",
-        "# comet_model_2.end() ## uncomment this line to end the comet experiment"
+        "cnn_model.fit(train_images, train_labels, batch_size=BATCH_SIZE, epochs=EPOCHS)\n",
+        "# cnn_model.fit('''TODO''')\n",
+        "# comet_model_2.end() ## uncomment this line to end the comet experiment"
       ]
     },
     {
@@ -501,7 +514,8 @@
       "outputs": [],
       "source": [
         "'''TODO: Use the evaluate method to test the model!'''\n",
-        "test_loss, test_acc = # TODO\n",
+        "test_loss, test_acc = cnn_model.evaluate(test_images, test_labels)\n",
+        "# test_loss, test_acc = # TODO\n",
         "\n",
         "print('Test accuracy:', test_acc)"
       ]
@@ -580,7 +594,8 @@
       "source": [
         "'''TODO: identify the digit with the highest confidence prediction for the first\n",
         "    image in the test dataset. '''\n",
-        "prediction = # TODO\n",
+        "prediction = np.argmax(predictions[0])\n",
+        "# prediction = # TODO\n",
         "\n",
         "print(prediction)"
       ]
@@ -710,21 +725,22 @@
         "  # GradientTape to record differentiation operations\n",
         "  with tf.GradientTape() as tape:\n",
         "    #'''TODO: feed the images into the model and obtain the predictions'''\n",
-        "    logits = # TODO\n",
+        "    logits = cnn_model(images)\n",
+        "    # logits = # TODO\n",
         "\n",
         "    #'''TODO: compute the sparse categorical cross entropy loss'''\n",
-        "    loss_value = tf.keras.backend.sparse_categorical_crossentropy('''TODO''', '''TODO''') # TODO\n",
-        "\n",
-        "    # log the loss to comet\n",
+        "    loss_value = tf.keras.backend.sparse_categorical_crossentropy(labels, logits)\n",
         "    comet_model_3.log_metric(\"loss\", loss_value.numpy().mean(), step=idx)\n",
+        "    # loss_value = tf.keras.backend.sparse_categorical_crossentropy('''TODO''', '''TODO''') # TODO\n",
         "\n",
         "  loss_history.append(loss_value.numpy().mean()) # append the loss to the loss_history record\n",
         "  plotter.plot(loss_history.get())\n",
         "\n",
         "  # Backpropagation\n",
         "  '''TODO: Use the tape to compute the gradient against all parameters in the CNN model.\n",
         "      Use cnn_model.trainable_variables to access these parameters.'''\n",
-        "  grads = # TODO\n",
+        "  grads = tape.gradient(loss_value, cnn_model.trainable_variables)\n",
+        "  # grads = # TODO\n",
         "  optimizer.apply_gradients(zip(grads, cnn_model.trainable_variables))\n",
         "\n",
         "comet_model_3.log_figure(figure=plt)\n",