@@ -27,9 +27,9 @@
    " <td align=\" center\" ><a target=\" _blank\" href=\" http://introtodeeplearning.com\" >\n " ,
    " <img src=\" https://i.ibb.co/Jr88sn2/mit.png\" style=\" padding-bottom:5px;\" />\n " ,
    " Visit MIT Deep Learning</a></td>\n " ,
-   " <td align=\" center\" ><a target=\" _blank\" href=\" https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab2/solutions/TF_Part2_Debiasing_Solution.ipynb\" >\n " ,
+   " <td align=\" center\" ><a target=\" _blank\" href=\" https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab2/TF_Part2_Debiasing.ipynb\" >\n " ,
    " <img src=\" https://i.ibb.co/2P3SLwK/colab.png\" style=\" padding-bottom:5px;\" />Run in Google Colab</a></td>\n " ,
-   " <td align=\" center\" ><a target=\" _blank\" href=\" https://github.com/aamini/introtodeeplearning/blob/master/lab2/solutions/TF_Part2_Debiasing_Solution.ipynb\" >\n " ,
+   " <td align=\" center\" ><a target=\" _blank\" href=\" https://github.com/aamini/introtodeeplearning/blob/master/lab2/TF_Part2_Debiasing.ipynb\" >\n " ,
    " <img src=\" https://i.ibb.co/xfJbPmL/github.png\" height=\" 70px\" style=\" padding-bottom:5px;\" />View Source on GitHub</a></td>\n " ,
    " </table>\n " ,
    " \n " ,
@@ -568,22 +568,19 @@
    " def vae_loss_function(x, x_recon, mu, logsigma, kl_weight=0.0005):\n " ,
    " # TODO: Define the latent loss. Note this is given in the equation for L_{KL}\n " ,
    " # in the text block directly above\n " ,
-   " latent_loss = 0.5 * tf.reduce_sum(tf.exp(logsigma) + tf.square(mu) - 1.0 - logsigma, axis=1)\n " ,
-   " # latent_loss = # TODO\n " ,
+   " latent_loss = # TODO\n " ,
    " \n " ,
    " # TODO: Define the reconstruction loss as the mean absolute pixel-wise\n " ,
    " # difference between the input and reconstruction. Hint: you'll need to\n " ,
    " # use tf.reduce_mean, and supply an axis argument which specifies which\n " ,
    " # dimensions to reduce over. For example, reconstruction loss needs to average\n " ,
    " # over the height, width, and channel image dimensions.\n " ,
    " # https://www.tensorflow.org/api_docs/python/tf/math/reduce_mean\n " ,
-   " reconstruction_loss = tf.reduce_mean(tf.abs(x-x_recon), axis=(1,2,3))\n " ,
-   " # reconstruction_loss = # TODO\n " ,
+   " reconstruction_loss = # TODO\n " ,
    " \n " ,
    " # TODO: Define the VAE loss. Note this is given in the equation for L_{VAE}\n " ,
    " # in the text block directly above\n " ,
-   " vae_loss = kl_weight * latent_loss + reconstruction_loss\n " ,
-   " # vae_loss = # TODO\n " ,
+   " vae_loss = # TODO\n " ,
    " \n " ,
    " return vae_loss"
    ],
@@ -637,8 +634,8 @@
    " \n " ,
    " # TODO: Define the reparameterization computation!\n " ,
    " # Note the equation is given in the text block immediately above.\n " ,
-   " z = z_mean + tf.math.exp(0.5 * z_logsigma) * epsilon \n " ,
-   " # z = # TODO \n " ,
+   " z = # TODO \n " ,
+   " \n " ,
    " return z"
    ],
   "execution_count" : null ,
@@ -722,25 +719,19 @@
    " def debiasing_loss_function(x, x_pred, y, y_logit, mu, logsigma):\n " ,
    " \n " ,
    " # TODO: call the relevant function to obtain VAE loss\n " ,
-   " vae_loss = vae_loss_function(x, x_pred, mu, logsigma)\n " ,
-   " # vae_loss = vae_loss_function('''TODO''') # TODO\n " ,
+   " vae_loss = vae_loss_function('''TODO''') # TODO\n " ,
    " \n " ,
    " # TODO: define the classification loss using sigmoid_cross_entropy\n " ,
    " # https://www.tensorflow.org/api_docs/python/tf/nn/sigmoid_cross_entropy_with_logits\n " ,
-   " classification_loss = tf.nn.sigmoid_cross_entropy_with_logits(labels=y, logits=y_logit)\n " ,
-   " # classification_loss = # TODO\n " ,
+   " classification_loss = # TODO\n " ,
    " \n " ,
    " # Use the training data labels to create variable face_indicator:\n " ,
    " # indicator that reflects which training data are images of faces\n " ,
    " face_indicator = tf.cast(tf.equal(y, 1), tf.float32)\n " ,
    " \n " ,
    " # TODO: define the DB-VAE total loss! Use tf.reduce_mean to average over all\n " ,
    " # samples\n " ,
-   " total_loss = tf.reduce_mean(\n " ,
-   " classification_loss +\n " ,
-   " face_indicator * vae_loss\n " ,
-   " )\n " ,
-   " # total_loss = # TODO\n " ,
+   " total_loss = # TODO\n " ,
    " \n " ,
    " return total_loss, classification_loss"
    ],
@@ -835,6 +826,7 @@
    " \n " ,
    " # classification prediction\n " ,
    " y_logit = tf.expand_dims(encoder_output[:, 0], -1)\n " ,
+   " \n " ,
    " # latent variable distribution parameters\n " ,
    " z_mean = encoder_output[:, 1:self.latent_dim+1]\n " ,
    " z_logsigma = encoder_output[:, self.latent_dim+1:]\n " ,
@@ -844,15 +836,13 @@
    " # VAE reparameterization: given a mean and logsigma, sample latent variables\n " ,
    " def reparameterize(self, z_mean, z_logsigma):\n " ,
    " # TODO: call the sampling function defined above\n " ,
-   " z = sampling(z_mean, z_logsigma)\n " ,
-   " # z = # TODO\n " ,
+   " z = # TODO\n " ,
    " return z\n " ,
    " \n " ,
    " # Decode the latent space and output reconstruction\n " ,
    " def decode(self, z):\n " ,
    " # TODO: use the decoder to output the reconstruction\n " ,
-   " reconstruction = self.decoder(z)\n " ,
-   " # reconstruction = # TODO\n " ,
+   " reconstruction = # TODO\n " ,
    " return reconstruction\n " ,
    " \n " ,
    " # The call function will be used to pass inputs x through the core VAE\n " ,
@@ -861,12 +851,10 @@
    " y_logit, z_mean, z_logsigma = self.encode(x)\n " ,
    " \n " ,
    " # TODO: reparameterization\n " ,
-   " z = self.reparameterize(z_mean, z_logsigma)\n " ,
-   " # z = # TODO\n " ,
+   " z = # TODO\n " ,
    " \n " ,
    " # TODO: reconstruction\n " ,
-   " recon = self.decode(z)\n " ,
-   " # recon = # TODO\n " ,
+   " recon = # TODO\n " ,
    " return y_logit, z_mean, z_logsigma, recon\n " ,
    " \n " ,
    " # Predict face or not face logit for given input x\n " ,
@@ -956,8 +944,7 @@
    " print(\" Recomputing the sampling probabilities\" )\n " ,
    " \n " ,
    " # TODO: run the input batch and get the latent variable means\n " ,
-   " mu = get_latent_mu(images, dbvae)\n " ,
-   " # mu = get_latent_mu('''TODO''') # TODO\n " ,
+   " mu = get_latent_mu('''TODO''') # TODO\n " ,
    " \n " ,
    " # sampling probabilities for the images\n " ,
    " training_sample_p = np.zeros(mu.shape[0])\n " ,
@@ -976,8 +963,7 @@
    " # TODO: call the digitize function to find which bins in the latent distribution\n " ,
    " # every data sample falls into\n " ,
    " # https://docs.scipy.org/doc/numpy-1.13.0/reference/generated/numpy.digitize.html\n " ,
-   " bin_idx = np.digitize(latent_distribution, bin_edges)\n " ,
-   " # bin_idx = np.digitize('''TODO''', '''TODO''') # TODO\n " ,
+   " bin_idx = np.digitize('''TODO''', '''TODO''') # TODO\n " ,
    " \n " ,
    " # smooth the density function\n " ,
    " hist_smoothed_density = hist_density + smoothing_fac\n " ,
@@ -987,13 +973,11 @@
    " p = 1.0/(hist_smoothed_density[bin_idx-1])\n " ,
    " \n " ,
    " # TODO: normalize all probabilities\n " ,
-   " p = p / np.sum(p)\n " ,
-   " # p = # TODO\n " ,
+   " p = # TODO\n " ,
    " \n " ,
    " # TODO: update sampling probabilities by considering whether the newly\n " ,
    " # computed p is greater than the existing sampling probabilities.\n " ,
-   " training_sample_p = np.maximum(p, training_sample_p)\n " ,
-   " # training_sample_p = # TODO\n " ,
+   " training_sample_p = # TODO\n " ,
    " \n " ,
    " # final normalization\n " ,
    " training_sample_p /= np.sum(training_sample_p)\n " ,
@@ -1044,13 +1028,11 @@
    " y_logit, z_mean, z_logsigma, x_recon = dbvae(x)\n " ,
    " \n " ,
    " '''TODO: call the DB_VAE loss function to compute the loss'''\n " ,
-   " loss, class_loss = debiasing_loss_function(x, x_recon, y, y_logit, z_mean, z_logsigma)\n " ,
-   " # loss, class_loss = debiasing_loss_function('''TODO arguments''') # TODO\n " ,
+   " loss, class_loss = debiasing_loss_function('''TODO arguments''') # TODO\n " ,
    " \n " ,
    " '''TODO: use the GradientTape.gradient method to compute the gradients.\n " ,
    " Hint: this is with respect to the trainable_variables of the dbvae.'''\n " ,
-   " grads = tape.gradient(loss, dbvae.trainable_variables)\n " ,
-   " # grads = tape.gradient('''TODO''', '''TODO''') # TODO\n " ,
+   " grads = tape.gradient('''TODO''', '''TODO''') # TODO\n " ,
    " \n " ,
    " # apply gradients to variables\n " ,
    " optimizer.apply_gradients(zip(grads, dbvae.trainable_variables))\n " ,
@@ -1070,8 +1052,7 @@
    " \n " ,
    " # Recompute data sampling probabilities\n " ,
    " '''TODO: recompute the sampling probabilities for debiasing'''\n " ,
-   " p_faces = get_training_sample_probabilities(all_faces, dbvae)\n " ,
-   " # p_faces = get_training_sample_probabilities('''TODO''', '''TODO''') # TODO\n " ,
+   " p_faces = get_training_sample_probabilities('''TODO''', '''TODO''') # TODO\n " ,
    " \n " ,
    " # get a batch of training data and compute the training step\n " ,
    " for j in tqdm(range(loader.get_train_size() // params[\" batch_size\" ])):\n " ,
@@ -1163,4 +1144,4 @@
    ]
   }
  ]
- }
+ }
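The hunks above reduce the adaptive resampling code inside get_training_sample_probabilities to TODO placeholders, and the diff only shows that function in fragments. For orientation, here is a minimal, self-contained NumPy sketch of the inverse-density resampling idea those hunks build up; the function name compute_resample_probabilities, the toy input shapes, and the default num_bins/smoothing_fac values are illustrative assumptions, not the lab's exact code.

import numpy as np

def compute_resample_probabilities(latent_means, num_bins=10, smoothing_fac=0.001):
    """Toy sketch: inverse-density sampling weights over each latent dimension.

    latent_means: array of shape (num_samples, latent_dim), e.g. the encoder's mu.
    Returns an array of shape (num_samples,) that sums to 1.
    """
    num_samples = latent_means.shape[0]
    training_sample_p = np.zeros(num_samples)

    # Treat each latent dimension independently, as in the hunks above.
    for i in range(latent_means.shape[1]):
        latent_distribution = latent_means[:, i]

        # Histogram of this latent variable across the dataset.
        hist_density, bin_edges = np.histogram(latent_distribution, bins=num_bins, density=True)

        # Widen the outer edges so every sample digitizes into a valid bin.
        bin_edges[0] = -float("inf")
        bin_edges[-1] = float("inf")
        bin_idx = np.digitize(latent_distribution, bin_edges)

        # Smooth the density and weight samples inversely to it, so rare
        # (under-represented) samples are drawn more often.
        hist_smoothed_density = hist_density + smoothing_fac
        p = 1.0 / hist_smoothed_density[bin_idx - 1]
        p = p / np.sum(p)

        # Keep the largest probability seen so far across latent dimensions.
        training_sample_p = np.maximum(p, training_sample_p)

    # Final normalization so the probabilities sum to 1.
    return training_sample_p / np.sum(training_sample_p)

# Example: 1000 fake latent means with 8 latent dimensions.
mu = np.random.randn(1000, 8)
p = compute_resample_probabilities(mu)
batch_idx = np.random.choice(len(mu), size=32, p=p)  # indices for one debiased batch

Samples that land in sparsely populated regions of the latent space receive larger weights, which is what lets the DB-VAE over-sample under-represented faces when it resamples the training data each epoch.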