Update gymnasium code to v1.0.0

93eb47d5 · Christof Kaufmann · 91c1fa0f · 93eb47d5
Commit 93eb47d5 authored 4 months ago by Christof Kaufmann
--- a/gym-graphic-output.ipynb
+++ b/gym-graphic-output.ipynb
@@ -16,7 +16,7 @@
  },
  {
   "cell_type": "code",
-   "execution_count": 8,
+   "execution_count": null,
   "id": "b425cecc-4212-434f-b57c-a9292c5a08d1",
   "metadata": {
    "tags": []
@@ -24,11 +24,12 @@
   "outputs": [],
   "source": [
    "import gymnasium as gym\n",
+    "import ale_py  # noqa # pylint: disable=unused-import\n",
    "\n",
-    "# env = gym.make(\"Pong-v4\", render_mode=\"rgb_array\")\n",
+    "# env = gym.make(\"ALE/Pong-v5\", render_mode=\"rgb_array\")\n",
    "# env.metadata['render_fps'] = 30\n",
    "\n",
-    "env = gym.make(\"LunarLander-v2\", render_mode=\"rgb_array\")\n",
+    "env = gym.make(\"LunarLander-v3\", render_mode=\"rgb_array\")\n",
    "\n",
    "env = gym.wrappers.RecordVideo(env, './video/', disable_logger=True,\n",
    "                               episode_trigger=lambda episode_id: episode_id % 5 == 0) # every 5th episode\n",
@@ -61,18 +62,18 @@
   "outputs": [],
   "source": [
    "import gymnasium as gym\n",
+    "import ale_py  # noqa # pylint: disable=unused-import\n",
    "import PIL.Image\n",
    "import os\n",
    "\n",
-    "# env = gym.make(\"Pong-v4\", render_mode=\"rgb_array\")\n",
+    "# env = gym.make(\"ALE/Pong-v5\", render_mode=\"rgb_array_list\")\n",
    "# env.metadata['render_fps'] = 30\n",
    "\n",
    "env = gym.make(\"CartPole-v1\", render_mode=\"rgb_array_list\")\n",
    "\n",
    "def save_gif(frames, filename='gym.gif'):\n",
    "    directory = os.path.dirname(filename)\n",
-    "    if not os.path.exists(directory):\n",
+    "    os.makedirs(directory, exist_ok=True)\n",
-    "        os.makedirs(directory)\n",
    "\n",
    "    images = [PIL.Image.fromarray(frame) for frame in frames]\n",
    "    images[0].save(filename, format='GIF', append_images=images[1:],\n",
@@ -111,11 +112,12 @@
   "outputs": [],
   "source": [
    "import gymnasium as gym\n",
+    "import ale_py  # noqa # pylint: disable=unused-import\n",
    "import matplotlib.pyplot as plt\n",
    "# you maybe have to restart your kernel, if you changed the matplotlib backend before\n",
    "%matplotlib widget\n",
    "\n",
-    "env = gym.make(\"LunarLander-v2\", render_mode=\"rgb_array\")\n",
+    "env = gym.make(\"LunarLander-v3\", render_mode=\"rgb_array\")\n",
    "observation, info = env.reset() # is required once before calling env.render()\n",
    "img = plt.imshow(env.render()) # only call this once to bring up the plot\n",
    "plt.show()\n",

 %% Cell type:markdown id:cb5980cf-bb11-477c-975d-c555dbd61e22 tags:
 # Graphic Output of Gymnasium Environments
 Although numeric values are probably better to monitor once you have some experience, in the beginning, for debugging, and for presentations you will want to watch your agent play games. Depending on the IDE, there are somewhat different ways to do it.
 ## Recording Videos
 The best solution is probably to record videos periodically. This way, you can look at the agent's capabilities at different stages of learning, and you can rewatch the videos later on. In JupyterLab, right-click on a video and select *Open in New Browser Tab*.
 %% Cell type:code id:b425cecc-4212-434f-b57c-a9292c5a08d1 tags:
 ``` python
 import gymnasium as gym
+import ale_py  # noqa # pylint: disable=unused-import
-# env = gym.make("Pong-v4", render_mode="rgb_array")
+# env = gym.make("ALE/Pong-v5", render_mode="rgb_array")
 # env.metadata['render_fps'] = 30
-env = gym.make("LunarLander-v2", render_mode="rgb_array")
+env = gym.make("LunarLander-v3", render_mode="rgb_array")
 env = gym.wrappers.RecordVideo(env, './video/', disable_logger=True,
                               episode_trigger=lambda episode_id: episode_id % 5 == 0) # every 5th episode
 observation, info = env.reset()
 for _ in range(1000):
    action = env.action_space.sample()
    observation, reward, terminated, truncated, info = env.step(action)
    if terminated or truncated:
        observation, info = env.reset()
 env.close()
 ```
 %% Cell type:markdown id:f95a4861 tags:
 ## Making GIFs
 GIFs are fun and easy to make and look at. Here is a way to make them after every episode.
 %% Cell type:code id:4e2994b5 tags:
 ``` python
 import gymnasium as gym
+import ale_py  # noqa # pylint: disable=unused-import
 import PIL.Image
 import os
-# env = gym.make("Pong-v4", render_mode="rgb_array")
+# env = gym.make("ALE/Pong-v5", render_mode="rgb_array_list")
 # env.metadata['render_fps'] = 30
 env = gym.make("CartPole-v1", render_mode="rgb_array_list")
 def save_gif(frames, filename='gym.gif'):
    directory = os.path.dirname(filename)
-    if not os.path.exists(directory):
+    os.makedirs(directory, exist_ok=True)
-        os.makedirs(directory)
    images = [PIL.Image.fromarray(frame) for frame in frames]
    images[0].save(filename, format='GIF', append_images=images[1:],
                   save_all=True, duration=30, loop=0)
 observation, info = env.reset()
 gif_count = 0
 for _ in range(1000):
    action = env.action_space.sample()
    observation, reward, terminated, truncated, info = env.step(action)
    if terminated or truncated:
        # save gif for every episode
        save_gif(env.render(), f'gifs/gym-{gif_count:04}.gif')
        gif_count += 1
        observation, info = env.reset()
 env.close()
 ```
 %% Cell type:markdown id:9f7a4b36-5204-4783-9b6e-55eb3568b591 tags:
 ## Live View using Matplotlib
 You can also watch the game live during training, maybe every few episodes or so. For that, choose `render_mode="rgb_array"` and make a first `imshow` plot. *Very important: The cell has to end after making the plot, because the plot will only be visible when the cell finishes.* In the second cell the plot gets updated.
 %% Cell type:code id:17be9d89-1246-4cd7-9258-49cff9ee6da9 tags:
 ``` python
 import gymnasium as gym
+import ale_py  # noqa # pylint: disable=unused-import
 import matplotlib.pyplot as plt
 # you maybe have to restart your kernel, if you changed the matplotlib backend before
 %matplotlib widget
-env = gym.make("LunarLander-v2", render_mode="rgb_array")
+env = gym.make("LunarLander-v3", render_mode="rgb_array")
 observation, info = env.reset() # is required once before calling env.render()
 img = plt.imshow(env.render()) # only call this once to bring up the plot
 plt.show()
 # IMPORTANT: Split your code at this point into two cells, so the plot can be drawn
 ```
 %% Cell type:code id:fe77c845-f5b0-4462-a4e6-c2b5c7fd71cf tags:
 ``` python
 # Second cell of the live view: step the environment with random actions and
 # push every newly rendered frame into the image object `img` that the
 # previous cell created with plt.imshow().
 observation, info = env.reset()
 for _ in range(150):
    action = env.action_space.sample()  # random action; no trained agent is used here
    observation, reward, terminated, truncated, info = env.step(action)
    if terminated or truncated:
        # the episode is over; reset so the remaining steps start a new episode
        observation, info = env.reset()
    # update plot
    img.set_data(env.render())
    plt.gcf().canvas.draw()  # redraw the current figure so the new frame is displayed
 env.close()
 print('done.')
 ```