{ "cells": [ { "cell_type": "code", "execution_count": 2, "metadata": {}, "outputs": [], "source": [ "import gym\n", "import gym_wordle\n", "from stable_baselines3 import DQN\n", "import numpy as np" ] }, { "cell_type": "code", "execution_count": 3, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ ">\n" ] } ], "source": [ "env = gym.make(\"Wordle-v0\")\n", "done = False\n", "\n", "print(env)" ] }, { "cell_type": "code", "execution_count": 4, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "Using cuda device\n", "Wrapping the env with a `Monitor` wrapper\n", "Wrapping the env in a DummyVecEnv.\n" ] }, { "name": "stderr", "output_type": "stream", "text": [ "/usr/local/lib/python3.8/dist-packages/stable_baselines3/common/vec_env/patch_gym.py:49: UserWarning: You provided an OpenAI Gym environment. We strongly recommend transitioning to Gymnasium environments. Stable-Baselines3 is automatically wrapping your environments in a compatibility layer, which could potentially cause issues.\n", " warnings.warn(\n" ] }, { "name": "stdout", "output_type": "stream", "text": [ "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.977 |\n", "| time/ | |\n", "| episodes | 4 |\n", "| fps | 8958 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 24 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.954 |\n", "| time/ | |\n", "| episodes | 8 |\n", "| fps | 8537 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 48 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.932 |\n", "| time/ | |\n", "| episodes | 12 |\n", "| fps | 8965 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 72 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.909 |\n", "| time/ | |\n", "| episodes | 16 |\n", "| fps | 8875 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 96 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.886 |\n", "| time/ | |\n", "| episodes | 20 |\n", "| fps | 8931 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 120 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.863 |\n", "| time/ | |\n", "| episodes | 24 |\n", "| fps | 8943 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 144 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.84 |\n", "| time/ | |\n", "| episodes | 28 |\n", "| fps | 8995 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 168 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.818 |\n", "| time/ | |\n", "| episodes | 32 |\n", "| fps | 8822 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 192 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.795 |\n", "| time/ | |\n", "| episodes | 36 |\n", "| fps | 8734 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 216 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.772 |\n", "| time/ | |\n", "| episodes | 40 |\n", "| fps | 8772 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 240 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.749 |\n", "| time/ | |\n", "| episodes | 44 |\n", "| fps | 8660 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 264 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.726 |\n", "| time/ | |\n", "| episodes | 48 |\n", "| fps | 8697 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 288 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.704 |\n", "| time/ | |\n", "| episodes | 52 |\n", "| fps | 8782 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 312 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.681 |\n", "| time/ | |\n", "| episodes | 56 |\n", "| fps | 8786 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 336 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.658 |\n", "| time/ | |\n", "| episodes | 60 |\n", "| fps | 8760 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 360 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.635 |\n", "| time/ | |\n", "| episodes | 64 |\n", "| fps | 8767 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 384 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.612 |\n", "| time/ | |\n", "| episodes | 68 |\n", "| fps | 8729 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 408 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.59 |\n", "| time/ | |\n", "| episodes | 72 |\n", "| fps | 8763 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 432 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.567 |\n", "| time/ | |\n", "| episodes | 76 |\n", "| fps | 8797 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 456 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.544 |\n", "| time/ | |\n", "| episodes | 80 |\n", "| fps | 8811 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 480 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.521 |\n", "| time/ | |\n", "| episodes | 84 |\n", "| fps | 8844 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 504 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.498 |\n", "| time/ | |\n", "| episodes | 88 |\n", "| fps | 8904 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 528 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.476 |\n", "| time/ | |\n", "| episodes | 92 |\n", "| fps | 8922 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 552 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.453 |\n", "| time/ | |\n", "| episodes | 96 |\n", "| fps | 8864 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 576 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.43 |\n", "| time/ | |\n", "| episodes | 100 |\n", "| fps | 8907 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 600 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.407 |\n", "| time/ | |\n", "| episodes | 104 |\n", "| fps | 8938 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 624 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.384 |\n", "| time/ | |\n", "| episodes | 108 |\n", "| fps | 8922 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 648 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.362 |\n", "| time/ | |\n", "| episodes | 112 |\n", "| fps | 8943 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 672 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.339 |\n", "| time/ | |\n", "| episodes | 116 |\n", "| fps | 8921 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 696 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.316 |\n", "| time/ | |\n", "| episodes | 120 |\n", "| fps | 8934 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 720 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.293 |\n", "| time/ | |\n", "| episodes | 124 |\n", "| fps | 8927 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 744 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.27 |\n", "| time/ | |\n", "| episodes | 128 |\n", "| fps | 8967 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 768 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.248 |\n", "| time/ | |\n", "| episodes | 132 |\n", "| fps | 8958 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 792 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.225 |\n", "| time/ | |\n", "| episodes | 136 |\n", "| fps | 8983 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 816 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.202 |\n", "| time/ | |\n", "| episodes | 140 |\n", "| fps | 9002 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 840 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.179 |\n", "| time/ | |\n", "| episodes | 144 |\n", "| fps | 9000 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 864 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.156 |\n", "| time/ | |\n", "| episodes | 148 |\n", "| fps | 9017 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 888 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.134 |\n", "| time/ | |\n", "| episodes | 152 |\n", "| fps | 9002 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 912 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.111 |\n", "| time/ | |\n", "| episodes | 156 |\n", "| fps | 9015 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 936 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.088 |\n", "| time/ | |\n", "| episodes | 160 |\n", "| fps | 8997 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 960 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.0652 |\n", "| time/ | |\n", "| episodes | 164 |\n", "| fps | 9007 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 984 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 168 |\n", "| fps | 9039 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1008 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 172 |\n", "| fps | 9048 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1032 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 176 |\n", "| fps | 9014 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1056 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 180 |\n", "| fps | 8996 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1080 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 184 |\n", "| fps | 8945 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1104 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 188 |\n", "| fps | 8922 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1128 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 192 |\n", "| fps | 8902 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1152 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 196 |\n", "| fps | 8881 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1176 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 200 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1200 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 204 |\n", "| fps | 8818 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1224 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 208 |\n", "| fps | 8798 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1248 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 212 |\n", "| fps | 8775 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1272 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 216 |\n", "| fps | 8767 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1296 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 220 |\n", "| fps | 8756 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1320 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 224 |\n", "| fps | 8740 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1344 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 228 |\n", "| fps | 8729 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1368 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 232 |\n", "| fps | 8737 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1392 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 236 |\n", "| fps | 8737 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1416 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 240 |\n", "| fps | 8752 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1440 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 244 |\n", "| fps | 8768 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1464 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 248 |\n", "| fps | 8778 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1488 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 252 |\n", "| fps | 8780 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1512 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 256 |\n", "| fps | 8787 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1536 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 260 |\n", "| fps | 8805 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1560 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 264 |\n", "| fps | 8819 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1584 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 268 |\n", "| fps | 8820 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1608 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 272 |\n", "| fps | 8837 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1632 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 276 |\n", "| fps | 8850 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1656 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 280 |\n", "| fps | 8856 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1680 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 284 |\n", "| fps | 8853 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1704 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 288 |\n", "| fps | 8867 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1728 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 292 |\n", "| fps | 8872 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1752 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 296 |\n", "| fps | 8865 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1776 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 300 |\n", "| fps | 8851 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1800 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 304 |\n", "| fps | 8840 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1824 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 308 |\n", "| fps | 8831 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1848 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 312 |\n", "| fps | 8838 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1872 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 316 |\n", "| fps | 8836 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1896 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 320 |\n", "| fps | 8833 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1920 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 324 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1944 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 328 |\n", "| fps | 8842 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1968 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 332 |\n", "| fps | 8855 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 1992 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 336 |\n", "| fps | 8866 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2016 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 340 |\n", "| fps | 8870 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2040 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 344 |\n", "| fps | 8873 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2064 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 348 |\n", "| fps | 8876 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2088 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 352 |\n", "| fps | 8891 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2112 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 356 |\n", "| fps | 8894 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2136 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 360 |\n", "| fps | 8902 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2160 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 364 |\n", "| fps | 8906 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2184 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 368 |\n", "| fps | 8915 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2208 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 372 |\n", "| fps | 8918 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2232 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 376 |\n", "| fps | 8917 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2256 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 380 |\n", "| fps | 8932 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2280 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 384 |\n", "| fps | 8942 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2304 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 388 |\n", "| fps | 8945 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2328 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 392 |\n", "| fps | 8942 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2352 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 396 |\n", "| fps | 8939 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2376 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 400 |\n", "| fps | 8943 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2400 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 404 |\n", "| fps | 8935 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2424 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 408 |\n", "| fps | 8928 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2448 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 412 |\n", "| fps | 8929 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2472 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 416 |\n", "| fps | 8928 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2496 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 420 |\n", "| fps | 8929 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2520 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 424 |\n", "| fps | 8932 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2544 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 428 |\n", "| fps | 8936 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2568 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 432 |\n", "| fps | 8932 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2592 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 436 |\n", "| fps | 8936 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2616 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 440 |\n", "| fps | 8938 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2640 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 444 |\n", "| fps | 8941 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2664 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 448 |\n", "| fps | 8949 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2688 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 452 |\n", "| fps | 8952 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2712 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 456 |\n", "| fps | 8952 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2736 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 460 |\n", "| fps | 8954 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2760 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 464 |\n", "| fps | 8956 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2784 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 468 |\n", "| fps | 8962 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2808 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 472 |\n", "| fps | 8960 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2832 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 476 |\n", "| fps | 8955 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2856 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 480 |\n", "| fps | 8959 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2880 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 484 |\n", "| fps | 8961 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2904 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 488 |\n", "| fps | 8966 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2928 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 492 |\n", "| fps | 8966 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2952 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 496 |\n", "| fps | 8969 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 2976 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 500 |\n", "| fps | 8964 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3000 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 504 |\n", "| fps | 8962 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3024 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 508 |\n", "| fps | 8957 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3048 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 512 |\n", "| fps | 8954 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3072 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 516 |\n", "| fps | 8953 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3096 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 520 |\n", "| fps | 8932 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3120 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 524 |\n", "| fps | 8940 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3144 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 528 |\n", "| fps | 8937 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3168 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 532 |\n", "| fps | 8927 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3192 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 536 |\n", "| fps | 8915 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3216 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 540 |\n", "| fps | 8914 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3240 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 544 |\n", "| fps | 8909 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3264 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 548 |\n", "| fps | 8899 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3288 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 552 |\n", "| fps | 8886 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3312 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 556 |\n", "| fps | 8889 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3336 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 560 |\n", "| fps | 8790 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3360 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 564 |\n", "| fps | 8794 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3384 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 568 |\n", "| fps | 8798 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3408 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 572 |\n", "| fps | 8793 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3432 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 576 |\n", "| fps | 8796 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3456 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 580 |\n", "| fps | 8800 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3480 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 584 |\n", "| fps | 8805 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3504 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 588 |\n", "| fps | 8815 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3528 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 592 |\n", "| fps | 8814 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3552 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 596 |\n", "| fps | 8817 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3576 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 600 |\n", "| fps | 8820 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3600 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 604 |\n", "| fps | 8824 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3624 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 608 |\n", "| fps | 8827 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3648 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 612 |\n", "| fps | 8821 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3672 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 616 |\n", "| fps | 8819 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3696 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 620 |\n", "| fps | 8809 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3720 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 624 |\n", "| fps | 8811 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3744 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 628 |\n", "| fps | 8809 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3768 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 632 |\n", "| fps | 8807 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3792 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 636 |\n", "| fps | 8813 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3816 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 640 |\n", "| fps | 8816 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3840 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 644 |\n", "| fps | 8806 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3864 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 648 |\n", "| fps | 8802 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3888 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 652 |\n", "| fps | 8807 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3912 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 656 |\n", "| fps | 8810 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3936 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 660 |\n", "| fps | 8813 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3960 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 664 |\n", "| fps | 8813 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 3984 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 668 |\n", "| fps | 8817 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4008 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 672 |\n", "| fps | 8817 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4032 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 676 |\n", "| fps | 8821 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4056 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 680 |\n", "| fps | 8822 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4080 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 684 |\n", "| fps | 8824 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4104 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 688 |\n", "| fps | 8826 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4128 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 692 |\n", "| fps | 8828 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4152 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 696 |\n", "| fps | 8822 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4176 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 700 |\n", "| fps | 8820 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4200 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 704 |\n", "| fps | 8822 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4224 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 708 |\n", "| fps | 8824 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4248 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 712 |\n", "| fps | 8826 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4272 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 716 |\n", "| fps | 8829 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4296 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 720 |\n", "| fps | 8825 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4320 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 724 |\n", "| fps | 8823 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4344 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 728 |\n", "| fps | 8827 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4368 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 732 |\n", "| fps | 8831 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4392 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 736 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4416 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 740 |\n", "| fps | 8836 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4440 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 744 |\n", "| fps | 8832 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4464 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 748 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4488 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 752 |\n", "| fps | 8841 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4512 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 756 |\n", "| fps | 8839 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4536 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 760 |\n", "| fps | 8842 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4560 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 764 |\n", "| fps | 8845 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4584 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 768 |\n", "| fps | 8848 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4608 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 772 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4632 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 776 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4656 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 780 |\n", "| fps | 8852 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4680 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 784 |\n", "| fps | 8854 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4704 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 788 |\n", "| fps | 8854 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4728 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 792 |\n", "| fps | 8857 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4752 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 796 |\n", "| fps | 8857 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4776 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 800 |\n", "| fps | 8861 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4800 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 804 |\n", "| fps | 8862 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4824 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 808 |\n", "| fps | 8862 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4848 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 812 |\n", "| fps | 8867 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4872 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 816 |\n", "| fps | 8869 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4896 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 820 |\n", "| fps | 8863 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4920 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 824 |\n", "| fps | 8868 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4944 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 828 |\n", "| fps | 8873 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4968 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 832 |\n", "| fps | 8875 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 4992 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 836 |\n", "| fps | 8877 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5016 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 840 |\n", "| fps | 8875 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5040 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 844 |\n", "| fps | 8869 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5064 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 848 |\n", "| fps | 8838 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5088 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 852 |\n", "| fps | 8819 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5112 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 856 |\n", "| fps | 8818 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5136 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 860 |\n", "| fps | 8817 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5160 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 864 |\n", "| fps | 8813 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5184 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 868 |\n", "| fps | 8817 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5208 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 872 |\n", "| fps | 8812 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5232 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 876 |\n", "| fps | 8816 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5256 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 880 |\n", "| fps | 8821 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5280 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 884 |\n", "| fps | 8824 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5304 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 888 |\n", "| fps | 8825 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5328 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 892 |\n", "| fps | 8826 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5352 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 896 |\n", "| fps | 8832 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5376 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 900 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5400 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 904 |\n", "| fps | 8836 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5424 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 908 |\n", "| fps | 8842 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5448 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 912 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5472 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 916 |\n", "| fps | 8850 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5496 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 920 |\n", "| fps | 8853 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5520 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 924 |\n", "| fps | 8843 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5544 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 928 |\n", "| fps | 8837 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5568 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 932 |\n", "| fps | 8823 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5592 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 936 |\n", "| fps | 8806 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5616 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 940 |\n", "| fps | 8796 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5640 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 944 |\n", "| fps | 8798 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5664 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 948 |\n", "| fps | 8791 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5688 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 952 |\n", "| fps | 8787 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5712 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 956 |\n", "| fps | 8788 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5736 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 960 |\n", "| fps | 8783 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5760 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 964 |\n", "| fps | 8782 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5784 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 968 |\n", "| fps | 8782 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5808 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 972 |\n", "| fps | 8787 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5832 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 976 |\n", "| fps | 8789 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5856 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 980 |\n", "| fps | 8787 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5880 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 984 |\n", "| fps | 8789 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5904 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 988 |\n", "| fps | 8792 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5928 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 992 |\n", "| fps | 8795 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5952 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 996 |\n", "| fps | 8798 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 5976 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1000 |\n", "| fps | 8801 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6000 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1004 |\n", "| fps | 8802 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6024 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1008 |\n", "| fps | 8805 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6048 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1012 |\n", "| fps | 8803 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6072 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1016 |\n", "| fps | 8807 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6096 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1020 |\n", "| fps | 8808 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6120 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1024 |\n", "| fps | 8812 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6144 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1028 |\n", "| fps | 8817 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6168 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1032 |\n", "| fps | 8819 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6192 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1036 |\n", "| fps | 8820 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6216 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1040 |\n", "| fps | 8820 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6240 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1044 |\n", "| fps | 8822 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6264 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1048 |\n", "| fps | 8825 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6288 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1052 |\n", "| fps | 8827 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6312 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1056 |\n", "| fps | 8826 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6336 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1060 |\n", "| fps | 8828 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6360 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1064 |\n", "| fps | 8828 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6384 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1068 |\n", "| fps | 8832 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6408 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1072 |\n", "| fps | 8833 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6432 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1076 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6456 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1080 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6480 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1084 |\n", "| fps | 8837 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6504 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1088 |\n", "| fps | 8840 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6528 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1092 |\n", "| fps | 8842 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6552 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1096 |\n", "| fps | 8845 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6576 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1100 |\n", "| fps | 8843 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6600 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1104 |\n", "| fps | 8841 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6624 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1108 |\n", "| fps | 8844 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6648 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1112 |\n", "| fps | 8848 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6672 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1116 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6696 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1120 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6720 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1124 |\n", "| fps | 8849 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6744 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1128 |\n", "| fps | 8852 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6768 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1132 |\n", "| fps | 8856 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6792 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1136 |\n", "| fps | 8858 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6816 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1140 |\n", "| fps | 8862 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6840 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1144 |\n", "| fps | 8864 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6864 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1148 |\n", "| fps | 8863 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6888 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1152 |\n", "| fps | 8867 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6912 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1156 |\n", "| fps | 8870 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6936 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1160 |\n", "| fps | 8873 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6960 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1164 |\n", "| fps | 8873 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 6984 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1168 |\n", "| fps | 8873 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7008 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1172 |\n", "| fps | 8872 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7032 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1176 |\n", "| fps | 8874 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7056 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1180 |\n", "| fps | 8870 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7080 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1184 |\n", "| fps | 8871 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7104 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1188 |\n", "| fps | 8870 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7128 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1192 |\n", "| fps | 8872 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7152 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1196 |\n", "| fps | 8873 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7176 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1200 |\n", "| fps | 8876 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7200 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1204 |\n", "| fps | 8879 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7224 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1208 |\n", "| fps | 8882 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7248 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1212 |\n", "| fps | 8881 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7272 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1216 |\n", "| fps | 8882 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7296 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1220 |\n", "| fps | 8881 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7320 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1224 |\n", "| fps | 8880 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7344 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1228 |\n", "| fps | 8883 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7368 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1232 |\n", "| fps | 8885 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7392 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1236 |\n", "| fps | 8888 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7416 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1240 |\n", "| fps | 8886 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7440 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1244 |\n", "| fps | 8887 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7464 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1248 |\n", "| fps | 8887 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7488 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1252 |\n", "| fps | 8887 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7512 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1256 |\n", "| fps | 8890 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7536 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1260 |\n", "| fps | 8887 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7560 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1264 |\n", "| fps | 8888 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7584 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1268 |\n", "| fps | 8890 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7608 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1272 |\n", "| fps | 8886 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7632 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1276 |\n", "| fps | 8889 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7656 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1280 |\n", "| fps | 8892 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7680 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1284 |\n", "| fps | 8892 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7704 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1288 |\n", "| fps | 8890 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7728 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1292 |\n", "| fps | 8888 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7752 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1296 |\n", "| fps | 8890 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7776 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1300 |\n", "| fps | 8894 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7800 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1304 |\n", "| fps | 8895 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7824 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1308 |\n", "| fps | 8898 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7848 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1312 |\n", "| fps | 8901 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7872 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1316 |\n", "| fps | 8901 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7896 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1320 |\n", "| fps | 8901 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7920 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1324 |\n", "| fps | 8901 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7944 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1328 |\n", "| fps | 8900 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7968 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1332 |\n", "| fps | 8903 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 7992 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1336 |\n", "| fps | 8906 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8016 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1340 |\n", "| fps | 8909 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8040 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1344 |\n", "| fps | 8909 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8064 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1348 |\n", "| fps | 8906 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8088 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1352 |\n", "| fps | 8906 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8112 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1356 |\n", "| fps | 8904 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8136 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1360 |\n", "| fps | 8904 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8160 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1364 |\n", "| fps | 8897 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8184 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1368 |\n", "| fps | 8880 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8208 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1372 |\n", "| fps | 8864 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8232 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1376 |\n", "| fps | 8849 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8256 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1380 |\n", "| fps | 8847 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8280 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1384 |\n", "| fps | 8845 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8304 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1388 |\n", "| fps | 8844 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8328 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1392 |\n", "| fps | 8842 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8352 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1396 |\n", "| fps | 8836 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8376 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1400 |\n", "| fps | 8834 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8400 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1404 |\n", "| fps | 8836 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8424 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1408 |\n", "| fps | 8834 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8448 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1412 |\n", "| fps | 8835 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8472 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1416 |\n", "| fps | 8836 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8496 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1420 |\n", "| fps | 8837 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8520 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1424 |\n", "| fps | 8839 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8544 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1428 |\n", "| fps | 8843 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8568 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1432 |\n", "| fps | 8844 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8592 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1436 |\n", "| fps | 8848 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8616 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1440 |\n", "| fps | 8850 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8640 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1444 |\n", "| fps | 8852 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8664 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1448 |\n", "| fps | 8853 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8688 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1452 |\n", "| fps | 8852 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8712 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1456 |\n", "| fps | 8851 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8736 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1460 |\n", "| fps | 8855 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8760 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1464 |\n", "| fps | 8854 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8784 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1468 |\n", "| fps | 8854 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8808 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1472 |\n", "| fps | 8856 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8832 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1476 |\n", "| fps | 8858 |\n", "| time_elapsed | 0 |\n", "| total_timesteps | 8856 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1480 |\n", "| fps | 8857 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 8880 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1484 |\n", "| fps | 8860 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 8904 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1488 |\n", "| fps | 8860 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 8928 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1492 |\n", "| fps | 8859 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 8952 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1496 |\n", "| fps | 8858 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 8976 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1500 |\n", "| fps | 8861 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9000 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1504 |\n", "| fps | 8863 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9024 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1508 |\n", "| fps | 8865 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9048 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1512 |\n", "| fps | 8865 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9072 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1516 |\n", "| fps | 8864 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9096 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1520 |\n", "| fps | 8866 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9120 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1524 |\n", "| fps | 8867 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9144 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1528 |\n", "| fps | 8866 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9168 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1532 |\n", "| fps | 8867 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9192 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1536 |\n", "| fps | 8871 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9216 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1540 |\n", "| fps | 8869 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9240 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1544 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9264 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1548 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9288 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1552 |\n", "| fps | 8872 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9312 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1556 |\n", "| fps | 8869 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9336 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1560 |\n", "| fps | 8867 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9360 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1564 |\n", "| fps | 8871 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9384 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1568 |\n", "| fps | 8873 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9408 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1572 |\n", "| fps | 8871 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9432 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1576 |\n", "| fps | 8871 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9456 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1580 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9480 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1584 |\n", "| fps | 8871 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9504 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1588 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9528 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1592 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9552 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1596 |\n", "| fps | 8873 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9576 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1600 |\n", "| fps | 8874 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9600 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1604 |\n", "| fps | 8874 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9624 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1608 |\n", "| fps | 8875 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9648 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1612 |\n", "| fps | 8875 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9672 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1616 |\n", "| fps | 8873 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9696 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1620 |\n", "| fps | 8873 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9720 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1624 |\n", "| fps | 8868 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9744 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1628 |\n", "| fps | 8867 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9768 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1632 |\n", "| fps | 8867 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9792 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1636 |\n", "| fps | 8866 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9816 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1640 |\n", "| fps | 8867 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9840 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1644 |\n", "| fps | 8869 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9864 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1648 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9888 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1652 |\n", "| fps | 8870 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9912 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1656 |\n", "| fps | 8858 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9936 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1660 |\n", "| fps | 8845 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9960 |\n", "----------------------------------\n", "----------------------------------\n", "| rollout/ | |\n", "| ep_len_mean | 6 |\n", "| ep_rew_mean | -6 |\n", "| exploration_rate | 0.05 |\n", "| time/ | |\n", "| episodes | 1664 |\n", "| fps | 8831 |\n", "| time_elapsed | 1 |\n", "| total_timesteps | 9984 |\n", "----------------------------------\n" ] }, { "data": { "text/plain": [ "" ] }, "execution_count": 4, "metadata": {}, "output_type": "execute_result" } ], "source": [ "model = DQN(\"MlpPolicy\", env, verbose=1)\n", "model.learn(total_timesteps=10000)" ] }, { "cell_type": "code", "execution_count": 15, "metadata": {}, "outputs": [], "source": [ "def test(model):\n", "\n", " end_rewards = []\n", "\n", " for i in range(1000):\n", " \n", " state = env.reset()\n", "\n", " done = False\n", "\n", " while not done:\n", "\n", " action, _states = model.predict(state, deterministic=True)\n", "\n", " state, reward, done, info = env.step(action)\n", "\n", " end_rewards.append(reward == 0)\n", " if (reward == 0):\n", " print(state)\n", "\n", " return np.sum(end_rewards) / len(end_rewards)" ] }, { "cell_type": "code", "execution_count": 17, "metadata": {}, "outputs": [ { "name": "stdout", "output_type": "stream", "text": [ "[[1 3 3 3 1 0 0 0 0 0]\n", " [1 1 1 1 1 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]]\n", "[[1 3 3 3 1 0 0 0 0 0]\n", " [1 1 1 1 1 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]\n", " [0 0 0 0 0 0 0 0 0 0]]\n", "0.002\n" ] } ], "source": [ "print(test(model))\n", "model.save(\"dqn_wordle\")" ] }, { "cell_type": "code", "execution_count": null, "metadata": {}, "outputs": [], "source": [] } ], "metadata": { "kernelspec": { "display_name": "Python 3 (ipykernel)", "language": "python", "name": "python3" }, "language_info": { "codemirror_mode": { "name": "ipython", "version": 3 }, "file_extension": ".py", "mimetype": "text/x-python", "name": "python", "nbconvert_exporter": "python", "pygments_lexer": "ipython3", "version": "3.8.10" } }, "nbformat": 4, "nbformat_minor": 2 }