|
89 | 89 | "id": "EvdePP-VyVWp" |
90 | 90 | }, |
91 | 91 | "source": [ |
| 92 | + "#Install some dependencies for visualizing the agents\n", |
| 93 | + "!apt-get install -y xvfb python-opengl x11-utils > /dev/null 2>&1\n", |
| 94 | + "!pip install gym pyvirtualdisplay scikit-video > /dev/null 2>&1\n", |
| 95 | + "\n", |
92 | 96 | "# Import Tensorflow 2.0\n", |
93 | 97 | "%tensorflow_version 2.x\n", |
94 | 98 | "import tensorflow as tf\n", |
|
241 | 245 | "\n", |
242 | 246 | "cartpole_model = create_cartpole_model()" |
243 | 247 | ], |
244 | | - "execution_count": null, |
| 248 | + "execution_count": 6, |
245 | 249 | "outputs": [] |
246 | 250 | }, |
247 | 251 | { |
|
289 | 293 | "\n", |
290 | 294 | " return action[0] if single else action" |
291 | 295 | ], |
292 | | - "execution_count": null, |
| 296 | + "execution_count": 7, |
293 | 297 | "outputs": [] |
294 | 298 | }, |
295 | 299 | { |
|
352 | 356 | "# Instantiate a single Memory buffer\n", |
353 | 357 | "memory = Memory()" |
354 | 358 | ], |
355 | | - "execution_count": null, |
| 359 | + "execution_count": 8, |
356 | 360 | "outputs": [] |
357 | 361 | }, |
358 | 362 | { |
|
404 | 408 | " \n", |
405 | 409 | " return normalize(discounted_rewards)" |
406 | 410 | ], |
407 | | - "execution_count": null, |
| 411 | + "execution_count": 9, |
408 | 412 | "outputs": [] |
409 | 413 | }, |
410 | 414 | { |
|
448 | 452 | " # loss = tf.reduce_mean('''TODO''')\n", |
449 | 453 | " return loss" |
450 | 454 | ], |
451 | | - "execution_count": null, |
| 455 | + "execution_count": 10, |
452 | 456 | "outputs": [] |
453 | 457 | }, |
454 | 458 | { |
|
482 | 486 | " # grads = tape.gradient('''TODO''', model.trainable_variables)\n", |
483 | 487 | " optimizer.apply_gradients(zip(grads, model.trainable_variables))\n" |
484 | 488 | ], |
485 | | - "execution_count": null, |
| 489 | + "execution_count": 11, |
486 | 490 | "outputs": [] |
487 | 491 | }, |
488 | 492 | { |
|
0 commit comments