
Commit 4fad6a3

pt l1p2 student
1 parent e87feae commit 4fad6a3

1 file changed

lab1/PT_Part2_Music_Generation.ipynb

Lines changed: 25 additions & 46 deletions
@@ -10,9 +10,9 @@
 "  <td align=\"center\"><a target=\"_blank\" href=\"http://introtodeeplearning.com\">\n",
 "    <img src=\"https://i.ibb.co/Jr88sn2/mit.png\" style=\"padding-bottom:5px;\" />\n",
 "    Visit MIT Deep Learning</a></td>\n",
-"  <td align=\"center\"><a target=\"_blank\" href=\"https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab1/solutions/PT_Part2_Music_Generation_Solution.ipynb\">\n",
+"  <td align=\"center\"><a target=\"_blank\" href=\"https://colab.research.google.com/github/aamini/introtodeeplearning/blob/master/lab1/PT_Part2_Music_Generation.ipynb\">\n",
 "    <img src=\"https://i.ibb.co/2P3SLwK/colab.png\" style=\"padding-bottom:5px;\" />Run in Google Colab</a></td>\n",
-"  <td align=\"center\"><a target=\"_blank\" href=\"https://github.com/aamini/introtodeeplearning/blob/master/lab1/solutions/PT_Part2_Music_Generation_Solution.ipynb\">\n",
+"  <td align=\"center\"><a target=\"_blank\" href=\"https://github.com/aamini/introtodeeplearning/blob/master/lab1/PT_Part2_Music_Generation.ipynb\">\n",
 "    <img src=\"https://i.ibb.co/xfJbPmL/github.png\" height=\"70px\" style=\"padding-bottom:5px;\" />View Source on GitHub</a></td>\n",
 "</table>\n",
 "\n",
@@ -61,7 +61,7 @@
 "First, let's download the course repository, install dependencies, and import the relevant packages we'll need for this lab.\n",
 "\n",
 "We will be using [Comet ML](https://www.comet.com/docs/v2/) to track our model development and training runs. First, sign up for a Comet account [at this link](https://www.comet.com/signup?utm_source=mit_dl&utm_medium=partner&utm_content=github\n",
-") (you can use your Google or Github account). This will generate a personal API Key, which you can find either in the first 'Get Started with Comet' page, under your account settings, or by pressing the '?' in the top right corner and then 'Quickstart Guide'. Enter this API key as the global variable `COMET_API_KEY`."
+") (you can use your Google or Github account). You will need to generate a new personal API Key, which you can find either in the first 'Get Started with Comet' page, under your account settings, or by pressing the '?' in the top right corner and then 'Quickstart Guide'. Enter this API key as the global variable `COMET_API_KEY`."
 ]
 },
 {
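The key itself is simply pasted into a notebook cell as a module-level global; a minimal sketch of that cell (the empty placeholder is an assumption — substitute your own key):

    # Store your personal Comet API key as a global, as the markdown cell instructs.
    COMET_API_KEY = ""  # paste the key from your Comet account settings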
@@ -269,11 +269,7 @@
 "  the number of characters in the input string\n",
 "'''\n",
 "def vectorize_string(string):\n",
-"  vectorized_output = np.array([char2idx[char] for char in string])\n",
-"  return vectorized_output\n",
-"\n",
-"# def vectorize_string(string):\n",
-"  # TODO\n",
+"  '''TODO'''\n",
 "\n",
 "vectorized_songs = vectorize_string(songs_joined)"
 ]
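For reference, the solution deleted in this hunk completes the TODO as follows; a standalone sketch, with a toy corpus standing in for the notebook's `songs_joined` and its `char2idx` table rebuilt in the usual way (the vocabulary construction here is an assumption about an earlier cell):

    import numpy as np

    songs_joined = "X:1\nT:Example tune\n"  # toy stand-in for the joined ABC songs
    char2idx = {ch: i for i, ch in enumerate(sorted(set(songs_joined)))}

    def vectorize_string(string):
        # Map each character to its integer ID from the lookup table.
        vectorized_output = np.array([char2idx[char] for char in string])
        return vectorized_output

    vectorized_songs = vectorize_string(songs_joined)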
@@ -332,10 +328,10 @@
 "  idx = np.random.choice(n - seq_length, batch_size)\n",
 "\n",
 "  '''TODO: construct a list of input sequences for the training batch'''\n",
-"  input_batch = [vectorized_songs[i: i + seq_length] for i in idx]\n",
+"  input_batch = # TODO\n",
 "\n",
 "  '''TODO: construct a list of output sequences for the training batch'''\n",
-"  output_batch = [vectorized_songs[i + 1: i + seq_length + 1] for i in idx]\n",
+"  output_batch = # TODO\n",
 "\n",
 "  # Convert the input and output batches to tensors\n",
 "  x_batch = torch.tensor(input_batch, dtype=torch.long)\n",
@@ -454,16 +450,13 @@
 "    # of a fixed embedding size\n",
 "    self.embedding = nn.Embedding(vocab_size, embedding_dim)\n",
 "\n",
-"    # Layer 2: LSTM with hidden_size `hidden_size`. note: number of layers defaults to 1.\n",
-"    # TODO: Use the nn.LSTM() module from pytorch.\n",
-"    self.lstm = nn.LSTM(embedding_dim, hidden_size, batch_first=True)\n",
-"    # self.lstm = nn.LSTM('''TODO''')\n",
+"    '''TODO: Layer 2: LSTM with hidden_size `hidden_size`. note: number of layers defaults to 1.\n",
+"    Use the nn.LSTM() module from pytorch.'''\n",
+"    self.lstm = nn.LSTM('''TODO''') # TODO\n",
 "\n",
-"    # Layer 3: Linear (fully-connected) layer that transforms the LSTM output\n",
-"    # into the vocabulary size.\n",
-"    # TODO: Add the Linear layer.\n",
-"    self.fc = nn.Linear(hidden_size, vocab_size)\n",
-"    # self.fc = nn.Linear('''TODO''')\n",
+"    '''TODO: Layer 3: Linear (fully-connected) layer that transforms the LSTM output\n",
+"    into the vocabulary size.'''\n",
+"    self.fc = nn.Linear('''TODO''') # TODO\n",
 "\n",
 "  def init_hidden(self, batch_size, device):\n",
 "    # Initialize hidden state and cell state with zeros\n",
@@ -650,12 +643,10 @@
 "  batched_labels = labels.view(-1)\n",
 "\n",
 "  ''' TODO: Batch the logits so that the shape of the logits should be (B * L, V) '''\n",
-"  batched_logits = logits.view(-1, logits.size(-1))\n",
-"  # batched_logits = \"\"\" TODO \"\"\" # TODO\n",
+"  batched_logits = \"\"\" TODO \"\"\" # TODO\n",
 "\n",
 "  '''TODO: Compute the cross-entropy loss using the batched next characters and predictions'''\n",
-"  loss = cross_entropy(batched_logits, batched_labels)\n",
-"  # loss = \"\"\" TODO \"\"\" # TODO\n",
+"  loss = \"\"\" TODO \"\"\" # TODO\n",
 "  return loss"
 ]
 },
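The removed solution flattens the batch and time dimensions before the loss; restated with shape comments (that `cross_entropy` refers to `torch.nn.functional.cross_entropy` is an assumption about an earlier import cell):

    # Reshape (B, L, V) logits to (B * L, V) to align with the flattened labels.
    batched_logits = logits.view(-1, logits.size(-1))
    # Cross-entropy between predicted distributions and the true next characters.
    loss = cross_entropy(batched_logits, batched_labels)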
@@ -668,8 +659,7 @@
 "\n",
 "'''TODO: compute the loss using the true next characters from the example batch\n",
 "  and the predictions from the untrained model several cells above'''\n",
-"example_batch_loss = compute_loss(y, pred)\n",
-"# example_batch_loss = compute_loss('''TODO''', '''TODO''') # TODO\n",
+"example_batch_loss = compute_loss('''TODO''', '''TODO''') # TODO\n",
 "\n",
 "print(f\"Prediction shape: {pred.shape} # (batch_size, sequence_length, vocab_size)\")\n",
 "print(f\"scalar_loss: {example_batch_loss.mean().item()}\")"
@@ -779,8 +769,7 @@
 "\n",
 "'''TODO: instantiate a new LSTMModel model for training using the hyperparameters\n",
 "  created above.'''\n",
-"model = LSTMModel(vocab_size, params[\"embedding_dim\"], params[\"hidden_size\"])\n",
-"# model = LSTMModel('''TODO: arguments''')\n",
+"model = LSTMModel('''TODO: arguments''')\n",
 "\n",
 "# Move the model to the GPU\n",
 "model.to(device)\n",
@@ -789,8 +778,7 @@
 "  Checkout the PyTorch website for a list of supported optimizers.\n",
 "  https://pytorch.org/docs/stable/optim.html\n",
 "  Try using the Adam optimizer to start.'''\n",
-"optimizer = torch.optim.Adam(model.parameters(), lr=params[\"learning_rate\"])\n",
-"# optimizer = # TODO\n",
+"optimizer = # TODO\n",
 "\n",
 "def train_step(x, y):\n",
 "  # Set the model's mode to train\n",
@@ -801,22 +789,19 @@
 "\n",
 "  # Forward pass\n",
 "  '''TODO: feed the current input into the model and generate predictions'''\n",
-"  y_hat = model(x) # TODO\n",
-"  # y_hat = model('''TODO''')\n",
+"  y_hat = model('''TODO''')\n",
 "\n",
 "  # Compute the loss\n",
 "  '''TODO: compute the loss!'''\n",
-"  loss = compute_loss(y, y_hat) # TODO\n",
-"  # loss = compute_loss('''TODO''', '''TODO''')\n",
+"  loss = compute_loss('''TODO''', '''TODO''')\n",
 "\n",
 "  # Backward pass\n",
 "  '''TODO: complete the gradient computation and update step.\n",
 "    Remember that in PyTorch there are two steps to the training loop:\n",
 "    1. Backpropagate the loss\n",
 "    2. Update the model parameters using the optimizer\n",
 "  '''\n",
-"  loss.backward() # TODO\n",
-"  optimizer.step() # TODO\n",
+"  '''TODO'''\n",
 "\n",
 "  return loss\n",
 "\n",
@@ -909,8 +894,7 @@
 "  # Evaluation step (generating ABC text using the learned RNN model)\n",
 "\n",
 "  '''TODO: convert the start string to numbers (vectorize)'''\n",
-"  input_idx = [char2idx[s] for s in start_string] # TODO\n",
-"  # input_idx = ['''TODO''']\n",
+"  input_idx = ['''TODO'''] # TODO\n",
 "  input_idx = torch.tensor([input_idx], dtype=torch.long).to(device)\n",
 "\n",
 "  # Initialize the hidden state\n",
@@ -922,21 +906,17 @@
 "\n",
 "  for i in tqdm(range(generation_length)):\n",
 "    '''TODO: evaluate the inputs and generate the next character predictions'''\n",
-"    predictions, state = model(input_idx, state, return_state=True)\n",
-"    # predictions, hidden_state = model('''TODO''', '''TODO''', return_state=True)\n",
+"    predictions, state = model('''TODO''', '''TODO''', return_state=True) # TODO\n",
 "\n",
 "    # Remove the batch dimension\n",
 "    predictions = predictions.squeeze(0)\n",
 "\n",
 "    '''TODO: use a multinomial distribution to sample over the probabilities'''\n",
-"    input_idx = torch.multinomial(torch.softmax(predictions, dim=-1), num_samples=1)\n",
-"    # input_idx = torch.multinomial('''TODO''', dim=-1), num_samples=1)\n",
+"    input_idx = torch.multinomial(torch.softmax('''TODO''', dim=-1), num_samples=1) # TODO\n",
 "\n",
 "    '''TODO: add the predicted character to the generated text!'''\n",
 "    # Hint: consider what format the prediction is in vs. the output\n",
-"    text_generated.append(idx2char[input_idx].item()) # TODO\n",
-"    # text_generated.append('''TODO''')\n",
-"\n",
+"    text_generated.append('''TODO''') # TODO\n",
 "\n",
 "  return (start_string + ''.join(text_generated))"
 ]
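The deleted lines spell out one step of the sampling loop: run the model while threading the recurrent state, softmax the logits, sample an ID, and map it back to a character:

    predictions, state = model(input_idx, state, return_state=True)
    predictions = predictions.squeeze(0)  # drop the batch dimension
    # Sample the next character ID from the softmaxed logits.
    input_idx = torch.multinomial(torch.softmax(predictions, dim=-1), num_samples=1)
    # idx2char maps the sampled ID back to its character.
    text_generated.append(idx2char[input_idx].item())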
@@ -951,8 +931,7 @@
 "source": [
 "'''TODO: Use the model and the function defined above to generate ABC format text of length 1000!\n",
 "  As you may notice, ABC files start with \"X\" - this may be a good start string.'''\n",
-"generated_text = generate_text(model, start_string=\"X\", generation_length=1000) # TODO\n",
-"# generated_text = generate_text('''TODO''', '''TODO''', '''TODO''')"
+"generated_text = generate_text('''TODO''', '''TODO''', '''TODO''') # TODO"
 ]
 },
 {
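And the deleted call that exercises it, seeding with "X" as the markdown cell suggests:

    # Generate 1000 characters of ABC-format text from the trained model.
    generated_text = generate_text(model, start_string="X", generation_length=1000)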
